{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 611,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "%matplotlib inline\n",
    "import pandas as pd\n",
    "import numpy as np\n",
    "import matplotlib.pyplot as plt\n",
    "import seaborn as sns\n",
    "import time\n",
    "import random\n",
    "from PIL import Image\n",
    "from PIL import ImageDraw\n",
    "plt.style.use({'figure.figsize':(10, 10)})\n",
    "# Use the fully qualified key: the bare 'max_rows' pattern also matches\n",
    "# 'styler.render.max_rows' on pandas versions that define it, which makes\n",
    "# set_option raise OptionError for an ambiguous pattern.\n",
    "pd.set_option('display.max_rows', 300)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 612,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "# Exploration schedule read by Choose_action:\n",
    "#   Epsilon = Epsilon_final + (Epsilon_start - Epsilon_final) * exp(-Decay_Rate * Action_times)\n",
    "Epsilon_start=1\n",
    "Epsilon_final=0.01\n",
    "Decay_Rate=0.0000001\n",
    "Robot_radium=40 # the radius of the hexapod robot (same units as map coordinates)\n",
    "# Distance moved by one forward step; Next_state_F uses these for actions 0, 1 and 2 respectively.\n",
    "Velocity_tripod=0.289*Robot_radium\n",
    "Velocity_quadruped=0.115*Robot_radium\n",
    "Velocity_onebyone=0.096*Robot_radium\n",
    "# NOTE(review): the three *_degree arrays are not referenced by any cell visible here.\n",
    "Up_degree=np.array([-40,-20,0,20,40])\n",
    "Left_degree=np.array([-60,-80,-100,-120])\n",
    "Right_degree=np.array([60,80,100,120]) # mirror image of Left_degree\n",
    "# Beta multiplies the best next-state value and Alpha scales the update step in Run_function's Q-table update.\n",
    "Beta=0.9\n",
    "Alpha=0.2"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "In the map, 'RGB' mode is used to represent different colors.\n",
    "\n",
    "(0,0,0)---Black---Obstacle and margin\n",
    "\n",
    "(255,255,255)---White---Flat ground\n",
    "\n",
    "(255,0,0)---Red---Destination\n",
    "\n",
    "(0,255,255)---Cyan---Hexapod robot"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 613,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "def Draw_map4(Destination_x,Destination_y):\n",
    "    \"\"\"Paint terrain map 4 and mark the destination on it.\n",
    "\n",
    "    The 3000x3000 canvas starts black (the obstacle margin). A white floor is\n",
    "    drawn over (40,40)-(2960,2960), then the terrain patches are painted in\n",
    "    list order, so later patches overwrite earlier ones where they overlap.\n",
    "    Finally a red disc of radius 20 is drawn around the destination.\n",
    "\n",
    "    Destination_x, Destination_y: centre of the destination disc in pixels.\n",
    "    Returns the PIL image.\n",
    "    \"\"\"\n",
    "    White=(255,255,255)  # Height_level reads this colour as level 0\n",
    "    Low=(202,235,216)    # Height_level reads this colour as level 1\n",
    "    High=(128,138,135)   # Height_level reads this colour as level 2\n",
    "    Patches=[\n",
    "        ((40,40,2960,2960),White),\n",
    "        ((500,800,1000,1200),Low),\n",
    "        ((500,800,800,1200),Low),\n",
    "        ((900,1300,1500,1800),High),\n",
    "        # Was (2000,800,800,1200): recent Pillow releases require x1>=x0 and\n",
    "        # raise ValueError otherwise. Same area, corners in ascending order.\n",
    "        ((800,800,2000,1200),Low),\n",
    "        ((500,250,800,500),Low),\n",
    "        ((2500,200,2700,1000),High),\n",
    "        ((1100,300,2000,700),High),\n",
    "        ((2200,1550,2700,1850),Low),\n",
    "        ((300,2000,1000,2700),Low),\n",
    "        ((1900,1900,2800,2500),High),\n",
    "    ]\n",
    "    im4=Image.new('RGB',size=(3000,3000),color=(0,0,0))\n",
    "    draw=ImageDraw.Draw(im4,mode='RGB')\n",
    "    for Box,Colour in Patches:\n",
    "        draw.rectangle(Box,Colour,Colour)\n",
    "    draw.ellipse((Destination_x-20,Destination_y-20,Destination_x+20,Destination_y+20), (255,0,0),(255,0,0))\n",
    "    return im4\n",
    "\n",
    "def Draw_map4_2(Destination_x,Destination_y):\n",
    "    \"\"\"Paint the second layout on a white floor and mark the destination.\n",
    "\n",
    "    A black 3000x3000 canvas gets a white floor over (40,40)-(2960,2960),\n",
    "    six terrain patches painted in list order, and a red disc of radius 20\n",
    "    centred on (Destination_x, Destination_y). Returns the PIL image.\n",
    "    \"\"\"\n",
    "    Pale=(202,235,216)\n",
    "    Grey=(128,138,135)\n",
    "    Layout=(\n",
    "        ((40,40,2960,2960),(255,255,255)),\n",
    "        ((500,800,1200,1200),Grey),\n",
    "        ((200,300,1500,700),Pale),\n",
    "        ((1800,300,2500,700),Pale),\n",
    "        ((2000,1200,2700,1900),Grey),\n",
    "        ((300,1600,1000,2700),Grey),\n",
    "        ((1600,2100,2500,2700),Pale),\n",
    "    )\n",
    "    Canvas=Image.new('RGB',size=(3000,3000),color=(0,0,0))\n",
    "    Pen=ImageDraw.Draw(Canvas,mode='RGB')\n",
    "    for Corners,Shade in Layout:\n",
    "        Pen.rectangle(Corners,Shade,Shade)\n",
    "    Goal_box=(Destination_x-20,Destination_y-20,Destination_x+20,Destination_y+20)\n",
    "    Pen.ellipse(Goal_box,(255,0,0),(255,0,0))\n",
    "    return Canvas\n",
    "# im4_2=Draw_map4_2(1750,500)\n",
    "# plt.imshow(im4_2)\n",
    "# plt.show()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 614,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "def Draw_map5(Destination_x,Destination_y):\n",
    "    \"\"\"Paint terrain map 5 and mark the destination on it.\n",
    "\n",
    "    The 3000x3000 canvas starts black (the obstacle margin). A floor of\n",
    "    colour (202,235,216) is drawn over (40,40)-(2960,2960), then the terrain\n",
    "    patches are painted in list order, so later patches overwrite earlier\n",
    "    ones where they overlap. Finally a red disc of radius 20 is drawn around\n",
    "    the destination.\n",
    "\n",
    "    Destination_x, Destination_y: centre of the destination disc in pixels.\n",
    "    Returns the PIL image.\n",
    "    \"\"\"\n",
    "    White=(255,255,255)  # Height_level reads this colour as level 0\n",
    "    Low=(202,235,216)    # Height_level reads this colour as level 1\n",
    "    High=(128,138,135)   # Height_level reads this colour as level 2\n",
    "    Patches=[\n",
    "        ((40,40,2960,2960),Low),\n",
    "        ((500,800,1000,1200),White),\n",
    "        ((500,800,800,1200),White),\n",
    "        ((900,1300,1500,1800),High),\n",
    "        # Was (2000,800,800,1200): recent Pillow releases require x1>=x0 and\n",
    "        # raise ValueError otherwise. Same area, corners in ascending order.\n",
    "        ((800,800,2000,1200),White),\n",
    "        ((500,250,800,500),White),\n",
    "        ((2500,200,2700,1000),High),\n",
    "        ((1100,300,2000,700),High),\n",
    "        ((2200,1550,2700,1850),White),\n",
    "        ((300,2000,1000,2700),White),\n",
    "        ((1900,1900,2800,2500),High),\n",
    "    ]\n",
    "    im5=Image.new('RGB',size=(3000,3000),color=(0,0,0))\n",
    "    draw=ImageDraw.Draw(im5,mode='RGB')\n",
    "    for Box,Colour in Patches:\n",
    "        draw.rectangle(Box,Colour,Colour)\n",
    "    draw.ellipse((Destination_x-20,Destination_y-20,Destination_x+20,Destination_y+20), (255,0,0),(255,0,0))\n",
    "    return im5\n",
    "\n",
    "def Draw_map5_2(Destination_x,Destination_y):\n",
    "    \"\"\"Paint the second layout on a (202,235,216) floor and mark the destination.\n",
    "\n",
    "    A black 3000x3000 canvas gets the floor over (40,40)-(2960,2960), six\n",
    "    terrain patches painted in list order, and a red disc of radius 20\n",
    "    centred on (Destination_x, Destination_y). Returns the PIL image.\n",
    "    \"\"\"\n",
    "    Plain=(255,255,255)\n",
    "    Pale=(202,235,216)\n",
    "    Grey=(128,138,135)\n",
    "    Layout=(\n",
    "        ((40,40,2960,2960),Pale),\n",
    "        ((500,800,1200,1200),Grey),\n",
    "        ((200,300,1500,700),Plain),\n",
    "        ((1800,300,2500,700),Plain),\n",
    "        ((2000,1200,2700,1900),Grey),\n",
    "        ((300,1600,1000,2700),Grey),\n",
    "        ((1600,2100,2500,2700),Plain),\n",
    "    )\n",
    "    Canvas=Image.new('RGB',size=(3000,3000),color=(0,0,0))\n",
    "    Pen=ImageDraw.Draw(Canvas,mode='RGB')\n",
    "    for Corners,Shade in Layout:\n",
    "        Pen.rectangle(Corners,Shade,Shade)\n",
    "    Goal_box=(Destination_x-20,Destination_y-20,Destination_x+20,Destination_y+20)\n",
    "    Pen.ellipse(Goal_box,(255,0,0),(255,0,0))\n",
    "    return Canvas\n",
    "# im5_2=Draw_map5_2(1750,500)\n",
    "# plt.imshow(im5_2)\n",
    "# plt.show()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 615,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "def Draw_map6_2(Destination_x,Destination_y):\n",
    "    \"\"\"Paint the second layout on a (128,138,135) floor and mark the destination.\n",
    "\n",
    "    A black 3000x3000 canvas gets the floor over (40,40)-(2960,2960), six\n",
    "    terrain patches painted in list order, and a red disc of radius 20\n",
    "    centred on (Destination_x, Destination_y). Returns the PIL image.\n",
    "    \"\"\"\n",
    "    Plain=(255,255,255)\n",
    "    Pale=(202,235,216)\n",
    "    Grey=(128,138,135)\n",
    "    Layout=(\n",
    "        ((40,40,2960,2960),Grey),\n",
    "        ((500,800,1200,1200),Plain),\n",
    "        ((200,300,1500,700),Plain),\n",
    "        ((1800,300,2500,700),Plain),\n",
    "        ((2000,1200,2700,1900),Pale),\n",
    "        ((300,1600,1000,2700),Pale),\n",
    "        ((1600,2100,2500,2700),Plain),\n",
    "    )\n",
    "    Canvas=Image.new('RGB',size=(3000,3000),color=(0,0,0))\n",
    "    Pen=ImageDraw.Draw(Canvas,mode='RGB')\n",
    "    for Corners,Shade in Layout:\n",
    "        Pen.rectangle(Corners,Shade,Shade)\n",
    "    Goal_box=(Destination_x-20,Destination_y-20,Destination_x+20,Destination_y+20)\n",
    "    Pen.ellipse(Goal_box,(255,0,0),(255,0,0))\n",
    "    return Canvas\n",
    "def Draw_map6(Destination_x,Destination_y):\n",
    "    \"\"\"Paint terrain map 6 and mark the destination on it.\n",
    "\n",
    "    The 3000x3000 canvas starts black (the obstacle margin). A floor of\n",
    "    colour (128,138,135) is drawn over (40,40)-(2960,2960), then the terrain\n",
    "    patches are painted in list order, so later patches overwrite earlier\n",
    "    ones where they overlap. Finally a red disc of radius 20 is drawn around\n",
    "    the destination.\n",
    "\n",
    "    Destination_x, Destination_y: centre of the destination disc in pixels.\n",
    "    Returns the PIL image.\n",
    "    \"\"\"\n",
    "    White=(255,255,255)  # Height_level reads this colour as level 0\n",
    "    Low=(202,235,216)    # Height_level reads this colour as level 1\n",
    "    High=(128,138,135)   # Height_level reads this colour as level 2\n",
    "    Patches=[\n",
    "        ((40,40,2960,2960),High),\n",
    "        ((500,800,1000,1200),White),\n",
    "        ((500,800,800,1200),White),\n",
    "        ((900,1300,1500,1800),Low),\n",
    "        # Was (2000,800,800,1200): recent Pillow releases require x1>=x0 and\n",
    "        # raise ValueError otherwise. Same area, corners in ascending order.\n",
    "        ((800,800,2000,1200),White),\n",
    "        ((500,250,800,500),White),\n",
    "        ((2500,200,2700,1000),Low),\n",
    "        ((1100,300,2000,700),Low),\n",
    "        ((2200,1550,2700,1850),White),\n",
    "        ((300,2000,1000,2700),White),\n",
    "        ((1900,1900,2800,2500),Low),\n",
    "    ]\n",
    "    im6=Image.new('RGB',size=(3000,3000),color=(0,0,0))\n",
    "    draw=ImageDraw.Draw(im6,mode='RGB')\n",
    "    for Box,Colour in Patches:\n",
    "        draw.rectangle(Box,Colour,Colour)\n",
    "    draw.ellipse((Destination_x-20,Destination_y-20,Destination_x+20,Destination_y+20), (255,0,0),(255,0,0))\n",
    "    return im6\n",
    "# im6_2=Draw_map6_2(1750,500)\n",
    "# plt.imshow(im6_2)\n",
    "# plt.show()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 616,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "# State labels have the form 'L<distance band>D<angle low>/<angle high>/H<height level>'.\n",
    "# Fastest-varying field first: 4 distance bands, then 12 angle bins of 30 degrees,\n",
    "# then 3 height levels, which matches the index built by Output_state_index.\n",
    "States=np.array(['%sD%d/%d/H%d'%(Band,Angle_low,Angle_low+30,Level)\n",
    "                 for Level in range(3)\n",
    "                 for Angle_low in range(0,360,30)\n",
    "                 for Band in ('L60','L180','L250','L300')])\n",
    "Actions=np.array(['FrontH0','FrontH1','FrontH2','Left_45D','Right_45D'])\n",
    "Length_state,Length_action=len(States),len(Actions)\n",
    "# Labelled all-zero table: one row per state, one column per action.\n",
    "Q_table=pd.DataFrame(np.zeros((Length_state,Length_action)),index=States,columns=Actions)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 618,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "def Initial_Q_Table(Length_action,Length_state):\n",
    "    \"\"\"Create an all-zero Q-table and announce it on stdout.\n",
    "\n",
    "    Note the argument order: number of actions first, number of states second.\n",
    "    Returns a float array of shape (Length_state, Length_action).\n",
    "    \"\"\"\n",
    "    Banner='***********************************************************'\n",
    "    Table=np.zeros(shape=(Length_state,Length_action))\n",
    "    for Line in (Banner,'Succeed to initialize Q-Table!',Banner):\n",
    "        print(Line)\n",
    "    return Table\n",
    "\n",
    "def Set_destination(x_range,y_range):\n",
    "    \"\"\"Pick a random destination at least 300 units away from every map edge.\n",
    "\n",
    "    The x coordinate is drawn before the y coordinate. Both are returned as\n",
    "    plain Python ints in [300, range-300).\n",
    "    \"\"\"\n",
    "    Margin=300\n",
    "    Column,Row=[int(np.random.randint(Margin,Extent-Margin)) for Extent in (x_range,y_range)]\n",
    "    return Column,Row"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 626,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "def Robot_destination(Destination_x,Destination_y,Robot_x,Robot_y,Robot_a):\n",
    "    \"\"\"Relative bearing and straight-line distance from the robot to the destination.\n",
    "\n",
    "    Robot_a is the robot heading in degrees. The bearing is\n",
    "    (Robot_a - direction to destination) mod 360, folded into [0, 180].\n",
    "\n",
    "    Returns (angle, side, distance). side is 'left' when the unfolded bearing\n",
    "    is at most 180 degrees, otherwise 'right' with angle = 360 - bearing.\n",
    "    \"\"\"\n",
    "    Delta_x=Destination_x-Robot_x\n",
    "    Delta_y=Destination_y-Robot_y\n",
    "    Distance=np.sqrt(Delta_x*Delta_x+Delta_y*Delta_y)\n",
    "    # arctan2 resolves the quadrant itself and is defined for Delta_x==0, where\n",
    "    # the former arctan(Delta_y/Delta_x) divided by zero. It can differ from the\n",
    "    # old value by a full turn, which the modulo below removes.\n",
    "    Direct_angle=np.arctan2(Delta_y,Delta_x)*180/np.pi\n",
    "    True_angle=(Robot_a-Direct_angle)%360\n",
    "    if True_angle>180:\n",
    "        return 360-True_angle,'right',Distance\n",
    "    return True_angle,'left',Distance\n",
    "\n",
    "def Is_Crash(Current_x,Current_y,im):\n",
    "    \"\"\"Report whether any probe point around the position lies on a black pixel.\n",
    "\n",
    "    Probes are taken at radii 0,5,...,45 in twelve directions 30 degrees apart,\n",
    "    inner rings first. Returns True at the first (0,0,0) pixel, else False.\n",
    "    \"\"\"\n",
    "    Bearings=(-150,-120,-90,-60,-30,0,30,60,90,120,150,180)\n",
    "    for Radius in range(0,50,5):\n",
    "        for Bearing in Bearings:\n",
    "            Probe=(Current_x+Radius*np.cos(Bearing/180*np.pi),\n",
    "                   Current_y+Radius*np.sin(Bearing/180*np.pi))\n",
    "            if im.getpixel(Probe)==(0,0,0):\n",
    "                return True\n",
    "    return False\n",
    "\n",
    "def Is_arrive(Current_x,Current_y,im):\n",
    "    \"\"\"Report whether a red destination pixel is found near the position.\n",
    "\n",
    "    Probes are taken at radii 0,5,...,25 in twelve directions 30 degrees apart,\n",
    "    inner rings first. The scan stops at the first black or red pixel: black\n",
    "    ends it with False, red ends it with True. No hit at all gives False.\n",
    "    \"\"\"\n",
    "    Bearings=(-150,-120,-90,-60,-30,0,30,60,90,120,150,180)\n",
    "    for Radius in range(0,30,5):\n",
    "        for Bearing in Bearings:\n",
    "            Probe=(Current_x+Radius*np.cos(Bearing/180*np.pi),\n",
    "                   Current_y+Radius*np.sin(Bearing/180*np.pi))\n",
    "            Pixel=im.getpixel(Probe)\n",
    "            if Pixel==(0,0,0):\n",
    "                return False\n",
    "            if Pixel==(255,0,0):\n",
    "                return True\n",
    "    return False\n",
    "\n",
    "def Random_start(x_range,y_range,im):\n",
    "    \"\"\"Sample a random heading and a random position that is neither crashed nor arrived.\n",
    "\n",
    "    The heading (degrees in [0,360)) is drawn once. Positions are redrawn, x\n",
    "    before y, until both Is_Crash and Is_arrive are False for the candidate.\n",
    "    Returns (x, y, heading).\n",
    "    \"\"\"\n",
    "    Heading=np.random.random()*360\n",
    "    while True:\n",
    "        Start_x=np.random.random()*x_range\n",
    "        Start_y=np.random.random()*y_range\n",
    "        if Is_Crash(Start_x,Start_y,im)==True or Is_arrive(Start_x,Start_y,im)==True:\n",
    "            continue\n",
    "        return Start_x,Start_y,Heading\n",
    "\n",
    "def Height_level(Current_x,Current_y,Current_a,im):\n",
    "    \"\"\"Highest terrain level found just ahead of the robot.\n",
    "\n",
    "    Pixels are sampled along three rays at -30, 0 and +30 degrees from the\n",
    "    heading Current_a, at distances 0,5,...,25 from the position. Colours map\n",
    "    to levels (255,255,255)->0, (202,235,216)->1, (128,138,135)->2; any other\n",
    "    colour counts as 0.\n",
    "\n",
    "    Two defects of the earlier version are fixed here: it returned the level\n",
    "    of the last sampled pixel instead of the maximum, and it used the degree\n",
    "    offsets as radii and the distances as angle offsets.\n",
    "\n",
    "    Returns 0, 1 or 2.\n",
    "    \"\"\"\n",
    "    Colour_level={(255,255,255):0,(202,235,216):1,(128,138,135):2}\n",
    "    Max_height=0\n",
    "    for Offset in (-30,0,30):\n",
    "        Ray=(Offset+Current_a)/180*np.pi\n",
    "        for Radius in range(0,30,5):\n",
    "            x=Current_x+Radius*np.cos(Ray)\n",
    "            y=Current_y+Radius*np.sin(Ray)\n",
    "            Max_height=max(Max_height,Colour_level.get(im.getpixel((x,y)),0))\n",
    "            if Max_height==2:\n",
    "                # Level 2 is the highest possible level, so stop scanning.\n",
    "                return Max_height\n",
    "    return Max_height\n",
    "\n",
    "def Output_state_index(True_angle,Left_right,Distance,Height):\n",
    "    \"\"\"Convert a bearing, distance and terrain height into a Q-table row index.\n",
    "\n",
    "    True_angle: folded bearing in degrees as returned by Robot_destination.\n",
    "    Left_right: 'left' or 'right'.\n",
    "    Distance:   distance to the destination; bands are [0,60), [60,180),\n",
    "                [180,250), and everything else.\n",
    "    Height:     terrain level 0, 1 or 2.\n",
    "\n",
    "    Returns (State_number, Dis_level, Angle_level), where Angle_level is\n",
    "    True_angle//30 and State_number = Height*48 + angle bin*4 + Dis_level.\n",
    "    'left' bearings use angle bins 0..6 directly; 'right' bearings are\n",
    "    mirrored into bins 6..11.\n",
    "\n",
    "    Raises ValueError for any other Left_right value (previously this\n",
    "    surfaced as an UnboundLocalError at the return statement).\n",
    "    \"\"\"\n",
    "    if Left_right!='left' and Left_right!='right':\n",
    "        raise ValueError('Left_right must be left or right, got %r'%(Left_right,))\n",
    "    if 0<=Distance<60:\n",
    "        Dis_level=0\n",
    "    elif 60<=Distance<180:\n",
    "        Dis_level=1\n",
    "    elif 180<=Distance<250:\n",
    "        Dis_level=2\n",
    "    else:\n",
    "        Dis_level=3\n",
    "    Angle_level=True_angle//30\n",
    "    if Left_right=='right':\n",
    "        Angle_slot=24+(5-Angle_level)*4\n",
    "    else:\n",
    "        Angle_slot=Angle_level*4\n",
    "    State_number=int(Height*48+Dis_level+Angle_slot)\n",
    "    return State_number,Dis_level,Angle_level\n",
    "\n",
    "def Choose_action(Q_Table,Current_state,Action_times):\n",
    "    \"\"\"Epsilon-greedy action choice for one state.\n",
    "\n",
    "    Epsilon decays exponentially with Action_times from Epsilon_start towards\n",
    "    Epsilon_final at rate Decay_Rate. A uniformly random action index is\n",
    "    returned when a random draw falls below Epsilon or the state's row is all\n",
    "    zeros; otherwise the index of the largest Q value in that row is returned.\n",
    "    \"\"\"\n",
    "    Span=Epsilon_start-Epsilon_final\n",
    "    Epsilon=Epsilon_final+Span*np.exp(-1*Decay_Rate*Action_times)\n",
    "    Row=Q_Table[Current_state,:]\n",
    "    Explore=np.random.random()<Epsilon or np.all(Row==[0])\n",
    "    return np.random.randint(Length_action) if Explore else np.argmax(Row)\n",
    "\n",
    "def Next_state_F(Robot_x,Robot_y,Robot_a,Destination_x,Destination_y,Action,im):\n",
    "    \"\"\"Apply one action and return the resulting pose, reward and status.\n",
    "\n",
    "    Actions 0, 1 and 2 move forward along the heading by Velocity_tripod,\n",
    "    Velocity_quadruped and Velocity_onebyone respectively, then test the new\n",
    "    position with Is_Crash and Is_arrive. Actions 3 and 4 rotate in place by\n",
    "    -60 and +60 degrees.\n",
    "\n",
    "    Reward: -10 when a forward action's index differs from the terrain level\n",
    "    at the starting pose; otherwise 10 on arrival, else a small penalty that\n",
    "    grows with the next distance level and angle level.\n",
    "\n",
    "    Returns (next_x, next_y, next_heading, Reward, Next_state_number, Arrive, Crash).\n",
    "    \"\"\"\n",
    "    Arrive=False\n",
    "    Crash=False\n",
    "    Current_height=Height_level(Robot_x,Robot_y,Robot_a,im)\n",
    "    if Action==0 or Action==1 or Action==2:\n",
    "        # The three forward gaits differ only in stride length.\n",
    "        Stride=(Velocity_tripod,Velocity_quadruped,Velocity_onebyone)[int(Action)]\n",
    "        Robot_next_x=Robot_x+Stride*np.cos(Robot_a/180*np.pi)\n",
    "        Robot_next_y=Robot_y+Stride*np.sin(Robot_a/180*np.pi)\n",
    "        Crash=Is_Crash(Robot_next_x,Robot_next_y,im)==True\n",
    "        Arrive=Is_arrive(Robot_next_x,Robot_next_y,im)==True\n",
    "    elif Action==3 or Action==4:\n",
    "        Robot_a=Robot_a-60 if Action==3 else Robot_a+60\n",
    "        Robot_next_x,Robot_next_y=Robot_x,Robot_y\n",
    "    Next_true_angle,Next_le_ri,Next_distance=Robot_destination(Destination_x,Destination_y,Robot_next_x,Robot_next_y,Robot_a)\n",
    "    Next_height=Height_level(Robot_next_x,Robot_next_y,Robot_a,im)\n",
    "    Next_state_number,Next_distance_level,Next_angle_level=Output_state_index(Next_true_angle,Next_le_ri,Next_distance,Next_height)\n",
    "    # Forward actions that are penalised on each terrain level.\n",
    "    Wrong_gaits={0:(1,2),1:(0,2),2:(0,1)}\n",
    "    if Action in Wrong_gaits.get(Current_height,()):\n",
    "        Reward=-10\n",
    "    elif Arrive:\n",
    "        Reward=10\n",
    "    else:\n",
    "        Reward=(-Next_distance_level-Next_angle_level*0.5)*0.01\n",
    "    return Robot_next_x,Robot_next_y,Robot_a,Reward,Next_state_number,Arrive,Crash"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 627,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "# Q_Table=Initial_Q_Table(Length_action,Length_state)\n",
    "# Arrival counter shared with Run_function, which declares it global and\n",
    "# increments it each time the robot reaches a destination.\n",
    "# The 'global' statement has no effect at module level; the assignment creates the name.\n",
    "global Epoche\n",
    "Epoche=0\n",
    "# global Action_times\n",
    "# Action_times=0"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 628,
   "metadata": {
    "collapsed": true,
    "scrolled": true
   },
   "outputs": [],
   "source": [
    "def _New_episode_map():\n",
    "    \"\"\"Pick a random destination, then paint it onto one of the six maps chosen at random.\n",
    "\n",
    "    Returns (Destination_x, Destination_y, im).\n",
    "    \"\"\"\n",
    "    Destination_x,Destination_y=Set_destination(3000,3000)\n",
    "    Map_builders=(Draw_map4,Draw_map5,Draw_map6,Draw_map4_2,Draw_map5_2,Draw_map6_2)\n",
    "    Choose_map=np.random.randint(6)\n",
    "    return Destination_x,Destination_y,Map_builders[Choose_map](Destination_x,Destination_y)\n",
    "\n",
    "def Run_function():\n",
    "    \"\"\"Train a fresh Q-table until the robot has reached 3000 destinations.\n",
    "\n",
    "    Each step observes the state, picks an epsilon-greedy action, applies it\n",
    "    with Next_state_F and updates the table. On a crash the robot is moved to\n",
    "    a new random start on the same map and no update is made. On arrival a\n",
    "    progress line is printed, a new destination and map are drawn, the robot\n",
    "    restarts at random, and the module-level Epoche counter is incremented.\n",
    "\n",
    "    Returns the trained Q-table (array of shape states x actions).\n",
    "    \"\"\"\n",
    "    global Epoche\n",
    "    Q_Table=Initial_Q_Table(Length_action,Length_state)\n",
    "    Action_times=0\n",
    "    Destination_x,Destination_y,im=_New_episode_map()\n",
    "    Current_x,Current_y,Current_a=Random_start(3000,3000,im)\n",
    "    Epoche_false=0\n",
    "    while Epoche_false<3000:\n",
    "        True_a,Le_ri,Distance=Robot_destination(Destination_x,Destination_y,Current_x,Current_y,Current_a)\n",
    "        Height_level_=Height_level(Current_x,Current_y,Current_a,im)\n",
    "        Current_state_number,Distance_level,Angle_level=Output_state_index(True_a,Le_ri,Distance,Height_level_)\n",
    "        Next_action=Choose_action(Q_Table,Current_state_number,Action_times)\n",
    "        Next_x,Next_y,Next_a,Reward,Next_state_number,Arrive,Crash=Next_state_F(Current_x,Current_y,Current_a,Destination_x,Destination_y,Next_action,im)\n",
    "        if Crash==True:\n",
    "            # NOTE(review): a crash only teleports the robot; the Q-table is not\n",
    "            # updated for the crashing transition. Confirm this is intended.\n",
    "            Next_x,Next_y,Next_a=Random_start(3000,3000,im)\n",
    "        else:\n",
    "            if Arrive==True:\n",
    "                print('Epsilon=%f Action_times=%d Epoche=%d'%(Epsilon_final+(Epsilon_start-Epsilon_final)*np.exp(-1*Decay_Rate*Action_times),Action_times,Epoche))\n",
    "                Destination_x,Destination_y,im=_New_episode_map()\n",
    "                Next_x,Next_y,Next_a=Random_start(3000,3000,im)\n",
    "                Epoche_false+=1\n",
    "                Epoche+=1\n",
    "            # NOTE(review): the target bootstraps from Next_state_number even when\n",
    "            # the step ended the episode by arriving. Confirm this is intended.\n",
    "            Q_target=Reward+Beta*max(Q_Table[Next_state_number])\n",
    "            Q_Table[Current_state_number][Next_action]+=Alpha*(Q_target-Q_Table[Current_state_number][Next_action])\n",
    "        Current_x=Next_x\n",
    "        Current_y=Next_y\n",
    "        Current_a=Next_a\n",
    "        Action_times+=1\n",
    "    return Q_Table\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 629,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "0\n",
      "***********************************************************\n",
      "Succeed to initialize Q-Table!\n",
      "***********************************************************\n",
      "Epsilon=0.995412 Action_times=46449 Epoche=0\n",
      "Epsilon=0.994413 Action_times=56596 Epoche=1\n",
      "Epsilon=0.985813 Action_times=144338 Epoche=2\n",
      "Epsilon=0.984892 Action_times=153780 Epoche=3\n",
      "Epsilon=0.983770 Action_times=165301 Epoche=4\n",
      "Epsilon=0.983724 Action_times=165766 Epoche=5\n",
      "Epsilon=0.983319 Action_times=169932 Epoche=6\n",
      "Epsilon=0.982667 Action_times=176634 Epoche=7\n",
      "Epsilon=0.982332 Action_times=180080 Epoche=8\n",
      "Epsilon=0.980455 Action_times=199398 Epoche=9\n",
      "Epsilon=0.979937 Action_times=204743 Epoche=10\n",
      "Epsilon=0.978214 Action_times=222517 Epoche=11\n",
      "Epsilon=0.978000 Action_times=224733 Epoche=12\n",
      "Epsilon=0.977699 Action_times=227837 Epoche=13\n",
      "Epsilon=0.976728 Action_times=237876 Epoche=14\n",
      "Epsilon=0.976542 Action_times=239807 Epoche=15\n",
      "Epsilon=0.975728 Action_times=248232 Epoche=16\n",
      "Epsilon=0.974917 Action_times=256627 Epoche=17\n",
      "Epsilon=0.974258 Action_times=263465 Epoche=18\n",
      "Epsilon=0.973801 Action_times=268205 Epoche=19\n",
      "Epsilon=0.973016 Action_times=276344 Epoche=20\n",
      "Epsilon=0.972928 Action_times=277260 Epoche=21\n",
      "Epsilon=0.972389 Action_times=282860 Epoche=22\n",
      "Epsilon=0.970972 Action_times=297597 Epoche=23\n",
      "Epsilon=0.970917 Action_times=298164 Epoche=24\n",
      "Epsilon=0.970517 Action_times=302334 Epoche=25\n",
      "Epsilon=0.970283 Action_times=304767 Epoche=26\n",
      "Epsilon=0.969828 Action_times=309505 Epoche=27\n",
      "Epsilon=0.969351 Action_times=314478 Epoche=28\n",
      "Epsilon=0.968927 Action_times=318899 Epoche=29\n",
      "Epsilon=0.968050 Action_times=328053 Epoche=30\n",
      "Epsilon=0.968017 Action_times=328394 Epoche=31\n",
      "Epsilon=0.967734 Action_times=331351 Epoche=32\n",
      "Epsilon=0.967509 Action_times=333697 Epoche=33\n",
      "Epsilon=0.966917 Action_times=339878 Epoche=34\n",
      "Epsilon=0.966214 Action_times=347237 Epoche=35\n",
      "Epsilon=0.966085 Action_times=348585 Epoche=36\n",
      "Epsilon=0.965833 Action_times=351220 Epoche=37\n",
      "Epsilon=0.965283 Action_times=356972 Epoche=38\n",
      "Epsilon=0.964313 Action_times=367132 Epoche=39\n",
      "Epsilon=0.963981 Action_times=370609 Epoche=40\n",
      "Epsilon=0.963556 Action_times=375064 Epoche=41\n",
      "Epsilon=0.963317 Action_times=377573 Epoche=42\n",
      "Epsilon=0.963197 Action_times=378833 Epoche=43\n",
      "Epsilon=0.963048 Action_times=380393 Epoche=44\n",
      "Epsilon=0.962568 Action_times=385433 Epoche=45\n",
      "Epsilon=0.962516 Action_times=385981 Epoche=46\n",
      "Epsilon=0.961708 Action_times=394465 Epoche=47\n",
      "Epsilon=0.961435 Action_times=397333 Epoche=48\n",
      "Epsilon=0.961270 Action_times=399072 Epoche=49\n",
      "Epsilon=0.960915 Action_times=402798 Epoche=50\n",
      "Epsilon=0.960473 Action_times=407450 Epoche=51\n",
      "Epsilon=0.960168 Action_times=410657 Epoche=52\n",
      "Epsilon=0.960037 Action_times=412043 Epoche=53\n",
      "Epsilon=0.959807 Action_times=414461 Epoche=54\n",
      "Epsilon=0.959688 Action_times=415710 Epoche=55\n",
      "Epsilon=0.959111 Action_times=421787 Epoche=56\n",
      "Epsilon=0.958980 Action_times=423168 Epoche=57\n",
      "Epsilon=0.958700 Action_times=426124 Epoche=58\n",
      "Epsilon=0.958070 Action_times=432769 Epoche=59\n",
      "Epsilon=0.957794 Action_times=435673 Epoche=60\n",
      "Epsilon=0.957558 Action_times=438172 Epoche=61\n",
      "Epsilon=0.957090 Action_times=443109 Epoche=62\n",
      "Epsilon=0.956996 Action_times=444100 Epoche=63\n",
      "Epsilon=0.956671 Action_times=447534 Epoche=64\n",
      "Epsilon=0.956349 Action_times=450930 Epoche=65\n",
      "Epsilon=0.955960 Action_times=455047 Epoche=66\n",
      "Epsilon=0.955635 Action_times=458482 Epoche=67\n",
      "Epsilon=0.955293 Action_times=462101 Epoche=68\n",
      "Epsilon=0.954945 Action_times=465783 Epoche=69\n",
      "Epsilon=0.954558 Action_times=469877 Epoche=70\n",
      "Epsilon=0.954404 Action_times=471509 Epoche=71\n",
      "Epsilon=0.954012 Action_times=475659 Epoche=72\n",
      "Epsilon=0.953635 Action_times=479655 Epoche=73\n",
      "Epsilon=0.953583 Action_times=480208 Epoche=74\n",
      "Epsilon=0.953209 Action_times=484167 Epoche=75\n",
      "Epsilon=0.952936 Action_times=487061 Epoche=76\n",
      "Epsilon=0.952832 Action_times=488164 Epoche=77\n",
      "Epsilon=0.952435 Action_times=492377 Epoche=78\n",
      "Epsilon=0.952054 Action_times=496422 Epoche=79\n",
      "Epsilon=0.951771 Action_times=499423 Epoche=80\n",
      "Epsilon=0.951522 Action_times=502074 Epoche=81\n",
      "Epsilon=0.951490 Action_times=502417 Epoche=82\n",
      "Epsilon=0.951039 Action_times=507204 Epoche=83\n",
      "Epsilon=0.950932 Action_times=508343 Epoche=84\n",
      "Epsilon=0.950838 Action_times=509336 Epoche=85\n",
      "Epsilon=0.950518 Action_times=512744 Epoche=86\n",
      "Epsilon=0.950355 Action_times=514472 Epoche=87\n",
      "Epsilon=0.950142 Action_times=516735 Epoche=88\n",
      "Epsilon=0.949831 Action_times=520051 Epoche=89\n",
      "Epsilon=0.949538 Action_times=523170 Epoche=90\n",
      "Epsilon=0.949033 Action_times=528546 Epoche=91\n",
      "Epsilon=0.948778 Action_times=531257 Epoche=92\n",
      "Epsilon=0.948714 Action_times=531943 Epoche=93\n",
      "Epsilon=0.948469 Action_times=534553 Epoche=94\n",
      "Epsilon=0.948293 Action_times=536431 Epoche=95\n",
      "Epsilon=0.947648 Action_times=543308 Epoche=96\n",
      "Epsilon=0.947362 Action_times=546350 Epoche=97\n",
      "Epsilon=0.947208 Action_times=547993 Epoche=98\n",
      "Epsilon=0.946827 Action_times=552062 Epoche=99\n",
      "Epsilon=0.946472 Action_times=555849 Epoche=100\n",
      "Epsilon=0.946368 Action_times=556965 Epoche=101\n",
      "Epsilon=0.946296 Action_times=557734 Epoche=102\n",
      "Epsilon=0.946109 Action_times=559731 Epoche=103\n",
      "Epsilon=0.945882 Action_times=562152 Epoche=104\n",
      "Epsilon=0.945484 Action_times=566412 Epoche=105\n",
      "Epsilon=0.944726 Action_times=574512 Epoche=106\n",
      "Epsilon=0.944654 Action_times=575284 Epoche=107\n",
      "Epsilon=0.944426 Action_times=577720 Epoche=108\n",
      "Epsilon=0.944026 Action_times=582011 Epoche=109\n",
      "Epsilon=0.943855 Action_times=583842 Epoche=110\n",
      "Epsilon=0.943554 Action_times=587066 Epoche=111\n",
      "Epsilon=0.943328 Action_times=589485 Epoche=112\n",
      "Epsilon=0.943176 Action_times=591114 Epoche=113\n",
      "Epsilon=0.942875 Action_times=594339 Epoche=114\n",
      "Epsilon=0.942672 Action_times=596512 Epoche=115\n",
      "Epsilon=0.942518 Action_times=598170 Epoche=116\n",
      "Epsilon=0.942282 Action_times=600696 Epoche=117\n",
      "Epsilon=0.941898 Action_times=604818 Epoche=118\n",
      "Epsilon=0.941633 Action_times=607665 Epoche=119\n",
      "Epsilon=0.941334 Action_times=610871 Epoche=120\n",
      "Epsilon=0.941083 Action_times=613563 Epoche=121\n",
      "Epsilon=0.941052 Action_times=613893 Epoche=122\n",
      "Epsilon=0.940808 Action_times=616523 Epoche=123\n",
      "Epsilon=0.940490 Action_times=619934 Epoche=124\n",
      "Epsilon=0.940302 Action_times=621954 Epoche=125\n",
      "Epsilon=0.940029 Action_times=624888 Epoche=126\n",
      "Epsilon=0.939755 Action_times=627835 Epoche=127\n",
      "Epsilon=0.939436 Action_times=631274 Epoche=128\n",
      "Epsilon=0.939393 Action_times=631736 Epoche=129\n",
      "Epsilon=0.939315 Action_times=632569 Epoche=130\n",
      "Epsilon=0.939148 Action_times=634372 Epoche=131\n",
      "Epsilon=0.938603 Action_times=640234 Epoche=132\n",
      "Epsilon=0.938304 Action_times=643461 Epoche=133\n",
      "Epsilon=0.938134 Action_times=645289 Epoche=134\n",
      "Epsilon=0.938078 Action_times=645892 Epoche=135\n",
      "Epsilon=0.937671 Action_times=650278 Epoche=136\n",
      "Epsilon=0.937337 Action_times=653878 Epoche=137\n",
      "Epsilon=0.936970 Action_times=657842 Epoche=138\n",
      "Epsilon=0.936741 Action_times=660303 Epoche=139\n",
      "Epsilon=0.936504 Action_times=662865 Epoche=140\n",
      "Epsilon=0.936115 Action_times=667062 Epoche=141\n",
      "Epsilon=0.935947 Action_times=668878 Epoche=142\n",
      "Epsilon=0.935815 Action_times=670306 Epoche=143\n",
      "Epsilon=0.935718 Action_times=671348 Epoche=144\n",
      "Epsilon=0.935499 Action_times=673714 Epoche=145\n",
      "Epsilon=0.934963 Action_times=679517 Epoche=146\n",
      "Epsilon=0.934786 Action_times=681426 Epoche=147\n",
      "Epsilon=0.934664 Action_times=682749 Epoche=148\n",
      "Epsilon=0.934386 Action_times=685754 Epoche=149\n",
      "Epsilon=0.934360 Action_times=686029 Epoche=150\n",
      "Epsilon=0.933936 Action_times=690620 Epoche=151\n",
      "Epsilon=0.933881 Action_times=691217 Epoche=152\n",
      "Epsilon=0.933734 Action_times=692809 Epoche=153\n",
      "Epsilon=0.933627 Action_times=693970 Epoche=154\n",
      "Epsilon=0.933582 Action_times=694458 Epoche=155\n",
      "Epsilon=0.933102 Action_times=699656 Epoche=156\n",
      "Epsilon=0.932891 Action_times=701942 Epoche=157\n",
      "Epsilon=0.932563 Action_times=705498 Epoche=158\n",
      "Epsilon=0.932333 Action_times=707983 Epoche=159\n",
      "Epsilon=0.932042 Action_times=711138 Epoche=160\n",
      "Epsilon=0.931836 Action_times=713380 Epoche=161\n",
      "Epsilon=0.931511 Action_times=716907 Epoche=162\n",
      "Epsilon=0.931281 Action_times=719394 Epoche=163\n",
      "Epsilon=0.931098 Action_times=721384 Epoche=164\n",
      "Epsilon=0.930938 Action_times=723118 Epoche=165\n",
      "Epsilon=0.930658 Action_times=726166 Epoche=166\n",
      "Epsilon=0.930641 Action_times=726352 Epoche=167\n",
      "Epsilon=0.930334 Action_times=729684 Epoche=168\n",
      "Epsilon=0.929932 Action_times=734054 Epoche=169\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.929575 Action_times=737938 Epoche=170\n",
      "Epsilon=0.929440 Action_times=739402 Epoche=171\n",
      "Epsilon=0.929233 Action_times=741651 Epoche=172\n",
      "Epsilon=0.929117 Action_times=742910 Epoche=173\n",
      "Epsilon=0.928885 Action_times=745437 Epoche=174\n",
      "Epsilon=0.928750 Action_times=746913 Epoche=175\n",
      "Epsilon=0.928557 Action_times=749008 Epoche=176\n",
      "Epsilon=0.928075 Action_times=754264 Epoche=177\n",
      "Epsilon=0.927828 Action_times=756952 Epoche=178\n",
      "Epsilon=0.927700 Action_times=758340 Epoche=179\n",
      "Epsilon=0.927493 Action_times=760597 Epoche=180\n",
      "Epsilon=0.927200 Action_times=763798 Epoche=181\n",
      "Epsilon=0.926660 Action_times=769686 Epoche=182\n",
      "Epsilon=0.926391 Action_times=772623 Epoche=183\n",
      "Epsilon=0.926127 Action_times=775501 Epoche=184\n",
      "Epsilon=0.925687 Action_times=780303 Epoche=185\n",
      "Epsilon=0.925354 Action_times=783937 Epoche=186\n",
      "Epsilon=0.925240 Action_times=785189 Epoche=187\n",
      "Epsilon=0.925095 Action_times=786776 Epoche=188\n",
      "Epsilon=0.924955 Action_times=788302 Epoche=189\n",
      "Epsilon=0.924880 Action_times=789120 Epoche=190\n",
      "Epsilon=0.924722 Action_times=790846 Epoche=191\n",
      "Epsilon=0.924673 Action_times=791387 Epoche=192\n",
      "Epsilon=0.924352 Action_times=794892 Epoche=193\n",
      "Epsilon=0.924109 Action_times=797551 Epoche=194\n",
      "Epsilon=0.923811 Action_times=800807 Epoche=195\n",
      "Epsilon=0.923546 Action_times=803712 Epoche=196\n",
      "Epsilon=0.923376 Action_times=805576 Epoche=197\n",
      "Epsilon=0.923103 Action_times=808562 Epoche=198\n",
      "Epsilon=0.922812 Action_times=811752 Epoche=199\n",
      "Epsilon=0.922701 Action_times=812964 Epoche=200\n",
      "Epsilon=0.922521 Action_times=814934 Epoche=201\n",
      "Epsilon=0.922221 Action_times=818231 Epoche=202\n",
      "Epsilon=0.922191 Action_times=818552 Epoche=203\n",
      "Epsilon=0.921834 Action_times=822474 Epoche=204\n",
      "Epsilon=0.921705 Action_times=823887 Epoche=205\n",
      "Epsilon=0.921582 Action_times=825231 Epoche=206\n",
      "Epsilon=0.920909 Action_times=832624 Epoche=207\n",
      "Epsilon=0.920722 Action_times=834675 Epoche=208\n",
      "Epsilon=0.920431 Action_times=837867 Epoche=209\n",
      "Epsilon=0.920211 Action_times=840283 Epoche=210\n",
      "Epsilon=0.919992 Action_times=842686 Epoche=211\n",
      "Epsilon=0.919697 Action_times=845937 Epoche=212\n",
      "Epsilon=0.919550 Action_times=847550 Epoche=213\n",
      "Epsilon=0.918939 Action_times=854272 Epoche=214\n",
      "Epsilon=0.918662 Action_times=857322 Epoche=215\n",
      "Epsilon=0.918557 Action_times=858474 Epoche=216\n",
      "Epsilon=0.918342 Action_times=860835 Epoche=217\n",
      "Epsilon=0.918025 Action_times=864325 Epoche=218\n",
      "Epsilon=0.917829 Action_times=866488 Epoche=219\n",
      "Epsilon=0.917144 Action_times=874040 Epoche=220\n",
      "Epsilon=0.916848 Action_times=877304 Epoche=221\n",
      "Epsilon=0.916542 Action_times=880676 Epoche=222\n",
      "Epsilon=0.916228 Action_times=884143 Epoche=223\n",
      "Epsilon=0.916098 Action_times=885574 Epoche=224\n",
      "Epsilon=0.915978 Action_times=886896 Epoche=225\n",
      "Epsilon=0.915821 Action_times=888636 Epoche=226\n",
      "Epsilon=0.915626 Action_times=890784 Epoche=227\n",
      "Epsilon=0.915274 Action_times=894674 Epoche=228\n",
      "Epsilon=0.915022 Action_times=897454 Epoche=229\n",
      "Epsilon=0.914848 Action_times=899377 Epoche=230\n",
      "Epsilon=0.914262 Action_times=905862 Epoche=231\n",
      "Epsilon=0.913980 Action_times=908975 Epoche=232\n",
      "Epsilon=0.913662 Action_times=912499 Epoche=233\n",
      "Epsilon=0.913331 Action_times=916161 Epoche=234\n",
      "Epsilon=0.913203 Action_times=917577 Epoche=235\n",
      "Epsilon=0.913087 Action_times=918866 Epoche=236\n",
      "Epsilon=0.913042 Action_times=919355 Epoche=237\n",
      "Epsilon=0.912768 Action_times=922397 Epoche=238\n",
      "Epsilon=0.912752 Action_times=922571 Epoche=239\n",
      "Epsilon=0.912565 Action_times=924640 Epoche=240\n",
      "Epsilon=0.912240 Action_times=928239 Epoche=241\n",
      "Epsilon=0.911991 Action_times=931004 Epoche=242\n",
      "Epsilon=0.911755 Action_times=933625 Epoche=243\n",
      "Epsilon=0.911491 Action_times=936552 Epoche=244\n",
      "Epsilon=0.911118 Action_times=940684 Epoche=245\n",
      "Epsilon=0.910911 Action_times=942987 Epoche=246\n",
      "Epsilon=0.910818 Action_times=944022 Epoche=247\n",
      "Epsilon=0.910775 Action_times=944491 Epoche=248\n",
      "Epsilon=0.910578 Action_times=946683 Epoche=249\n",
      "Epsilon=0.910290 Action_times=949885 Epoche=250\n",
      "Epsilon=0.910066 Action_times=952368 Epoche=251\n",
      "Epsilon=0.909918 Action_times=954014 Epoche=252\n",
      "Epsilon=0.909831 Action_times=954980 Epoche=253\n",
      "Epsilon=0.909728 Action_times=956119 Epoche=254\n",
      "Epsilon=0.909452 Action_times=959187 Epoche=255\n",
      "Epsilon=0.909216 Action_times=961818 Epoche=256\n",
      "Epsilon=0.909059 Action_times=963568 Epoche=257\n",
      "Epsilon=0.908883 Action_times=965516 Epoche=258\n",
      "Epsilon=0.908627 Action_times=968372 Epoche=259\n",
      "Epsilon=0.908372 Action_times=971203 Epoche=260\n",
      "Epsilon=0.908223 Action_times=972871 Epoche=261\n",
      "Epsilon=0.908175 Action_times=973396 Epoche=262\n",
      "Epsilon=0.908067 Action_times=974602 Epoche=263\n",
      "Epsilon=0.908053 Action_times=974761 Epoche=264\n",
      "Epsilon=0.907961 Action_times=975783 Epoche=265\n",
      "Epsilon=0.907806 Action_times=977514 Epoche=266\n",
      "Epsilon=0.907716 Action_times=978516 Epoche=267\n",
      "Epsilon=0.907662 Action_times=979108 Epoche=268\n",
      "Epsilon=0.907611 Action_times=979682 Epoche=269\n",
      "Epsilon=0.907503 Action_times=980890 Epoche=270\n",
      "Epsilon=0.907364 Action_times=982436 Epoche=271\n",
      "Epsilon=0.907301 Action_times=983141 Epoche=272\n",
      "Epsilon=0.907180 Action_times=984488 Epoche=273\n",
      "Epsilon=0.906958 Action_times=986955 Epoche=274\n",
      "Epsilon=0.906800 Action_times=988719 Epoche=275\n",
      "Epsilon=0.906720 Action_times=989612 Epoche=276\n",
      "Epsilon=0.906615 Action_times=990780 Epoche=277\n",
      "Epsilon=0.906555 Action_times=991450 Epoche=278\n",
      "Epsilon=0.906370 Action_times=993517 Epoche=279\n",
      "Epsilon=0.906110 Action_times=996417 Epoche=280\n",
      "Epsilon=0.905903 Action_times=998726 Epoche=281\n",
      "Epsilon=0.905877 Action_times=999017 Epoche=282\n",
      "Epsilon=0.905451 Action_times=1003779 Epoche=283\n",
      "Epsilon=0.905207 Action_times=1006502 Epoche=284\n",
      "Epsilon=0.905142 Action_times=1007224 Epoche=285\n",
      "Epsilon=0.904859 Action_times=1010393 Epoche=286\n",
      "Epsilon=0.904823 Action_times=1010791 Epoche=287\n",
      "Epsilon=0.904611 Action_times=1013155 Epoche=288\n",
      "Epsilon=0.904589 Action_times=1013407 Epoche=289\n",
      "Epsilon=0.904383 Action_times=1015705 Epoche=290\n",
      "Epsilon=0.904186 Action_times=1017912 Epoche=291\n",
      "Epsilon=0.904041 Action_times=1019536 Epoche=292\n",
      "Epsilon=0.903900 Action_times=1021115 Epoche=293\n",
      "Epsilon=0.903652 Action_times=1023890 Epoche=294\n",
      "Epsilon=0.903573 Action_times=1024768 Epoche=295\n",
      "Epsilon=0.903461 Action_times=1026027 Epoche=296\n",
      "Epsilon=0.903190 Action_times=1029056 Epoche=297\n",
      "Epsilon=0.903026 Action_times=1030893 Epoche=298\n",
      "Epsilon=0.902988 Action_times=1031317 Epoche=299\n",
      "Epsilon=0.902849 Action_times=1032876 Epoche=300\n",
      "Epsilon=0.902682 Action_times=1034743 Epoche=301\n",
      "Epsilon=0.902636 Action_times=1035266 Epoche=302\n",
      "Epsilon=0.902530 Action_times=1036444 Epoche=303\n",
      "Epsilon=0.902200 Action_times=1040146 Epoche=304\n",
      "Epsilon=0.901927 Action_times=1043204 Epoche=305\n",
      "Epsilon=0.901793 Action_times=1044704 Epoche=306\n",
      "Epsilon=0.901668 Action_times=1046108 Epoche=307\n",
      "Epsilon=0.901581 Action_times=1047087 Epoche=308\n",
      "Epsilon=0.901526 Action_times=1047707 Epoche=309\n",
      "Epsilon=0.901405 Action_times=1049057 Epoche=310\n",
      "Epsilon=0.901119 Action_times=1052272 Epoche=311\n",
      "Epsilon=0.900882 Action_times=1054933 Epoche=312\n",
      "Epsilon=0.900740 Action_times=1056520 Epoche=313\n",
      "Epsilon=0.900640 Action_times=1057644 Epoche=314\n",
      "Epsilon=0.900396 Action_times=1060382 Epoche=315\n",
      "Epsilon=0.900211 Action_times=1062462 Epoche=316\n",
      "Epsilon=0.900144 Action_times=1063212 Epoche=317\n",
      "Epsilon=0.899963 Action_times=1065253 Epoche=318\n",
      "Epsilon=0.899674 Action_times=1068499 Epoche=319\n",
      "Epsilon=0.899422 Action_times=1071333 Epoche=320\n",
      "Epsilon=0.899255 Action_times=1073210 Epoche=321\n",
      "Epsilon=0.898892 Action_times=1077295 Epoche=322\n",
      "Epsilon=0.898786 Action_times=1078489 Epoche=323\n",
      "Epsilon=0.898727 Action_times=1079153 Epoche=324\n",
      "Epsilon=0.898235 Action_times=1084687 Epoche=325\n",
      "Epsilon=0.897983 Action_times=1087527 Epoche=326\n",
      "Epsilon=0.897531 Action_times=1092610 Epoche=327\n",
      "Epsilon=0.897117 Action_times=1097283 Epoche=328\n",
      "Epsilon=0.896973 Action_times=1098901 Epoche=329\n",
      "Epsilon=0.896624 Action_times=1102834 Epoche=330\n",
      "Epsilon=0.896240 Action_times=1107171 Epoche=331\n",
      "Epsilon=0.895854 Action_times=1111524 Epoche=332\n",
      "Epsilon=0.895729 Action_times=1112943 Epoche=333\n",
      "Epsilon=0.895495 Action_times=1115579 Epoche=334\n",
      "Epsilon=0.895220 Action_times=1118688 Epoche=335\n",
      "Epsilon=0.895061 Action_times=1120485 Epoche=336\n",
      "Epsilon=0.894651 Action_times=1125114 Epoche=337\n",
      "Epsilon=0.894369 Action_times=1128304 Epoche=338\n",
      "Epsilon=0.893849 Action_times=1134186 Epoche=339\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.893418 Action_times=1139061 Epoche=340\n",
      "Epsilon=0.893284 Action_times=1140577 Epoche=341\n",
      "Epsilon=0.893167 Action_times=1141904 Epoche=342\n",
      "Epsilon=0.893007 Action_times=1143713 Epoche=343\n",
      "Epsilon=0.892825 Action_times=1145781 Epoche=344\n",
      "Epsilon=0.892642 Action_times=1147847 Epoche=345\n",
      "Epsilon=0.892551 Action_times=1148882 Epoche=346\n",
      "Epsilon=0.892325 Action_times=1151447 Epoche=347\n",
      "Epsilon=0.892235 Action_times=1152464 Epoche=348\n",
      "Epsilon=0.892088 Action_times=1154127 Epoche=349\n",
      "Epsilon=0.891657 Action_times=1159014 Epoche=350\n",
      "Epsilon=0.891546 Action_times=1160277 Epoche=351\n",
      "Epsilon=0.891217 Action_times=1164007 Epoche=352\n",
      "Epsilon=0.890872 Action_times=1167921 Epoche=353\n",
      "Epsilon=0.890834 Action_times=1168357 Epoche=354\n",
      "Epsilon=0.890820 Action_times=1168520 Epoche=355\n",
      "Epsilon=0.890525 Action_times=1171866 Epoche=356\n",
      "Epsilon=0.890342 Action_times=1173948 Epoche=357\n",
      "Epsilon=0.890293 Action_times=1174506 Epoche=358\n",
      "Epsilon=0.890120 Action_times=1176468 Epoche=359\n",
      "Epsilon=0.890040 Action_times=1177376 Epoche=360\n",
      "Epsilon=0.889700 Action_times=1181241 Epoche=361\n",
      "Epsilon=0.889504 Action_times=1183469 Epoche=362\n",
      "Epsilon=0.889157 Action_times=1187413 Epoche=363\n",
      "Epsilon=0.889138 Action_times=1187629 Epoche=364\n",
      "Epsilon=0.888898 Action_times=1190358 Epoche=365\n",
      "Epsilon=0.888805 Action_times=1191416 Epoche=366\n",
      "Epsilon=0.888709 Action_times=1192512 Epoche=367\n",
      "Epsilon=0.888386 Action_times=1196188 Epoche=368\n",
      "Epsilon=0.888269 Action_times=1197522 Epoche=369\n",
      "Epsilon=0.888119 Action_times=1199227 Epoche=370\n",
      "Epsilon=0.887850 Action_times=1202287 Epoche=371\n",
      "Epsilon=0.887624 Action_times=1204867 Epoche=372\n",
      "Epsilon=0.887587 Action_times=1205291 Epoche=373\n",
      "Epsilon=0.887461 Action_times=1206725 Epoche=374\n",
      "Epsilon=0.887289 Action_times=1208680 Epoche=375\n",
      "Epsilon=0.887121 Action_times=1210603 Epoche=376\n",
      "Epsilon=0.886820 Action_times=1214030 Epoche=377\n",
      "Epsilon=0.886705 Action_times=1215344 Epoche=378\n",
      "Epsilon=0.886608 Action_times=1216450 Epoche=379\n",
      "Epsilon=0.886409 Action_times=1218717 Epoche=380\n",
      "Epsilon=0.886246 Action_times=1220576 Epoche=381\n",
      "Epsilon=0.886019 Action_times=1223166 Epoche=382\n",
      "Epsilon=0.885873 Action_times=1224834 Epoche=383\n",
      "Epsilon=0.885645 Action_times=1227443 Epoche=384\n",
      "Epsilon=0.885528 Action_times=1228773 Epoche=385\n",
      "Epsilon=0.885439 Action_times=1229791 Epoche=386\n",
      "Epsilon=0.885290 Action_times=1231492 Epoche=387\n",
      "Epsilon=0.885127 Action_times=1233359 Epoche=388\n",
      "Epsilon=0.885106 Action_times=1233603 Epoche=389\n",
      "Epsilon=0.884994 Action_times=1234877 Epoche=390\n",
      "Epsilon=0.884987 Action_times=1234954 Epoche=391\n",
      "Epsilon=0.884836 Action_times=1236685 Epoche=392\n",
      "Epsilon=0.884661 Action_times=1238686 Epoche=393\n",
      "Epsilon=0.884577 Action_times=1239645 Epoche=394\n",
      "Epsilon=0.884350 Action_times=1242245 Epoche=395\n",
      "Epsilon=0.884183 Action_times=1244155 Epoche=396\n",
      "Epsilon=0.884151 Action_times=1244521 Epoche=397\n",
      "Epsilon=0.884068 Action_times=1245470 Epoche=398\n",
      "Epsilon=0.883870 Action_times=1247730 Epoche=399\n",
      "Epsilon=0.883736 Action_times=1249272 Epoche=400\n",
      "Epsilon=0.883535 Action_times=1251573 Epoche=401\n",
      "Epsilon=0.883494 Action_times=1252040 Epoche=402\n",
      "Epsilon=0.883423 Action_times=1252844 Epoche=403\n",
      "Epsilon=0.883369 Action_times=1253467 Epoche=404\n",
      "Epsilon=0.883316 Action_times=1254073 Epoche=405\n",
      "Epsilon=0.883120 Action_times=1256314 Epoche=406\n",
      "Epsilon=0.883063 Action_times=1256967 Epoche=407\n",
      "Epsilon=0.882909 Action_times=1258734 Epoche=408\n",
      "Epsilon=0.882757 Action_times=1260479 Epoche=409\n",
      "Epsilon=0.882746 Action_times=1260608 Epoche=410\n",
      "Epsilon=0.882619 Action_times=1262060 Epoche=411\n",
      "Epsilon=0.882548 Action_times=1262875 Epoche=412\n",
      "Epsilon=0.882458 Action_times=1263902 Epoche=413\n",
      "Epsilon=0.882369 Action_times=1264919 Epoche=414\n",
      "Epsilon=0.882254 Action_times=1266242 Epoche=415\n",
      "Epsilon=0.882179 Action_times=1267104 Epoche=416\n",
      "Epsilon=0.882104 Action_times=1267963 Epoche=417\n",
      "Epsilon=0.881983 Action_times=1269353 Epoche=418\n",
      "Epsilon=0.881901 Action_times=1270286 Epoche=419\n",
      "Epsilon=0.881726 Action_times=1272298 Epoche=420\n",
      "Epsilon=0.881714 Action_times=1272431 Epoche=421\n",
      "Epsilon=0.881602 Action_times=1273718 Epoche=422\n",
      "Epsilon=0.881551 Action_times=1274307 Epoche=423\n",
      "Epsilon=0.881340 Action_times=1276729 Epoche=424\n",
      "Epsilon=0.881285 Action_times=1277355 Epoche=425\n",
      "Epsilon=0.881110 Action_times=1279365 Epoche=426\n",
      "Epsilon=0.881055 Action_times=1280003 Epoche=427\n",
      "Epsilon=0.880938 Action_times=1281341 Epoche=428\n",
      "Epsilon=0.880862 Action_times=1282219 Epoche=429\n",
      "Epsilon=0.880717 Action_times=1283885 Epoche=430\n",
      "Epsilon=0.880433 Action_times=1287145 Epoche=431\n",
      "Epsilon=0.880327 Action_times=1288354 Epoche=432\n",
      "Epsilon=0.880279 Action_times=1288906 Epoche=433\n",
      "Epsilon=0.880154 Action_times=1290353 Epoche=434\n",
      "Epsilon=0.880115 Action_times=1290791 Epoche=435\n",
      "Epsilon=0.879993 Action_times=1292193 Epoche=436\n",
      "Epsilon=0.879921 Action_times=1293021 Epoche=437\n",
      "Epsilon=0.879695 Action_times=1295620 Epoche=438\n",
      "Epsilon=0.879513 Action_times=1297712 Epoche=439\n",
      "Epsilon=0.879435 Action_times=1298608 Epoche=440\n",
      "Epsilon=0.879277 Action_times=1300435 Epoche=441\n",
      "Epsilon=0.878975 Action_times=1303911 Epoche=442\n",
      "Epsilon=0.878869 Action_times=1305122 Epoche=443\n",
      "Epsilon=0.878753 Action_times=1306461 Epoche=444\n",
      "Epsilon=0.878582 Action_times=1308431 Epoche=445\n",
      "Epsilon=0.878405 Action_times=1310467 Epoche=446\n",
      "Epsilon=0.878028 Action_times=1314815 Epoche=447\n",
      "Epsilon=0.877619 Action_times=1319523 Epoche=448\n",
      "Epsilon=0.877543 Action_times=1320403 Epoche=449\n",
      "Epsilon=0.877451 Action_times=1321460 Epoche=450\n",
      "Epsilon=0.877163 Action_times=1324778 Epoche=451\n",
      "Epsilon=0.877058 Action_times=1325990 Epoche=452\n",
      "Epsilon=0.876934 Action_times=1327417 Epoche=453\n",
      "Epsilon=0.876766 Action_times=1329360 Epoche=454\n",
      "Epsilon=0.876713 Action_times=1329976 Epoche=455\n",
      "Epsilon=0.876457 Action_times=1332928 Epoche=456\n",
      "Epsilon=0.876402 Action_times=1333558 Epoche=457\n",
      "Epsilon=0.876398 Action_times=1333604 Epoche=458\n",
      "Epsilon=0.876258 Action_times=1335217 Epoche=459\n",
      "Epsilon=0.876110 Action_times=1336929 Epoche=460\n",
      "Epsilon=0.876099 Action_times=1337052 Epoche=461\n",
      "Epsilon=0.875946 Action_times=1338826 Epoche=462\n",
      "Epsilon=0.875766 Action_times=1340905 Epoche=463\n",
      "Epsilon=0.875504 Action_times=1343925 Epoche=464\n",
      "Epsilon=0.875404 Action_times=1345088 Epoche=465\n",
      "Epsilon=0.875238 Action_times=1347004 Epoche=466\n",
      "Epsilon=0.875009 Action_times=1349656 Epoche=467\n",
      "Epsilon=0.874846 Action_times=1351535 Epoche=468\n",
      "Epsilon=0.874702 Action_times=1353197 Epoche=469\n",
      "Epsilon=0.874616 Action_times=1354192 Epoche=470\n",
      "Epsilon=0.874269 Action_times=1358207 Epoche=471\n",
      "Epsilon=0.873909 Action_times=1362371 Epoche=472\n",
      "Epsilon=0.873843 Action_times=1363141 Epoche=473\n",
      "Epsilon=0.873754 Action_times=1364175 Epoche=474\n",
      "Epsilon=0.873401 Action_times=1368254 Epoche=475\n",
      "Epsilon=0.873301 Action_times=1369411 Epoche=476\n",
      "Epsilon=0.873140 Action_times=1371281 Epoche=477\n",
      "Epsilon=0.873116 Action_times=1371553 Epoche=478\n",
      "Epsilon=0.873024 Action_times=1372621 Epoche=479\n",
      "Epsilon=0.872913 Action_times=1373907 Epoche=480\n",
      "Epsilon=0.872764 Action_times=1375643 Epoche=481\n",
      "Epsilon=0.872557 Action_times=1378041 Epoche=482\n",
      "Epsilon=0.872546 Action_times=1378163 Epoche=483\n",
      "Epsilon=0.872451 Action_times=1379269 Epoche=484\n",
      "Epsilon=0.872322 Action_times=1380766 Epoche=485\n",
      "Epsilon=0.872319 Action_times=1380802 Epoche=486\n",
      "Epsilon=0.872243 Action_times=1381673 Epoche=487\n",
      "Epsilon=0.872158 Action_times=1382659 Epoche=488\n",
      "Epsilon=0.872050 Action_times=1383915 Epoche=489\n",
      "Epsilon=0.871684 Action_times=1388166 Epoche=490\n",
      "Epsilon=0.871361 Action_times=1391912 Epoche=491\n",
      "Epsilon=0.871212 Action_times=1393643 Epoche=492\n",
      "Epsilon=0.870925 Action_times=1396978 Epoche=493\n",
      "Epsilon=0.870753 Action_times=1398976 Epoche=494\n",
      "Epsilon=0.870611 Action_times=1400619 Epoche=495\n",
      "Epsilon=0.870589 Action_times=1400881 Epoche=496\n",
      "Epsilon=0.870451 Action_times=1402484 Epoche=497\n",
      "Epsilon=0.870317 Action_times=1404036 Epoche=498\n",
      "Epsilon=0.870199 Action_times=1405411 Epoche=499\n",
      "Epsilon=0.870131 Action_times=1406201 Epoche=500\n",
      "Epsilon=0.870108 Action_times=1406470 Epoche=501\n",
      "Epsilon=0.869991 Action_times=1407826 Epoche=502\n",
      "Epsilon=0.869801 Action_times=1410034 Epoche=503\n",
      "Epsilon=0.869576 Action_times=1412656 Epoche=504\n",
      "Epsilon=0.869466 Action_times=1413938 Epoche=505\n",
      "Epsilon=0.869366 Action_times=1415100 Epoche=506\n",
      "Epsilon=0.869087 Action_times=1418349 Epoche=507\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.868940 Action_times=1420062 Epoche=508\n",
      "Epsilon=0.868853 Action_times=1421074 Epoche=509\n",
      "Epsilon=0.868792 Action_times=1421778 Epoche=510\n",
      "Epsilon=0.868628 Action_times=1423696 Epoche=511\n",
      "Epsilon=0.868303 Action_times=1427472 Epoche=512\n",
      "Epsilon=0.868207 Action_times=1428600 Epoche=513\n",
      "Epsilon=0.868145 Action_times=1429321 Epoche=514\n",
      "Epsilon=0.867987 Action_times=1431162 Epoche=515\n",
      "Epsilon=0.867977 Action_times=1431272 Epoche=516\n",
      "Epsilon=0.867739 Action_times=1434053 Epoche=517\n",
      "Epsilon=0.867510 Action_times=1436723 Epoche=518\n",
      "Epsilon=0.867313 Action_times=1439023 Epoche=519\n",
      "Epsilon=0.867130 Action_times=1441152 Epoche=520\n",
      "Epsilon=0.866931 Action_times=1443477 Epoche=521\n",
      "Epsilon=0.866730 Action_times=1445820 Epoche=522\n",
      "Epsilon=0.866576 Action_times=1447621 Epoche=523\n",
      "Epsilon=0.866403 Action_times=1449634 Epoche=524\n",
      "Epsilon=0.866384 Action_times=1449857 Epoche=525\n",
      "Epsilon=0.866314 Action_times=1450677 Epoche=526\n",
      "Epsilon=0.866265 Action_times=1451253 Epoche=527\n",
      "Epsilon=0.866140 Action_times=1452707 Epoche=528\n",
      "Epsilon=0.865947 Action_times=1454963 Epoche=529\n",
      "Epsilon=0.865904 Action_times=1455472 Epoche=530\n",
      "Epsilon=0.865770 Action_times=1457032 Epoche=531\n",
      "Epsilon=0.865658 Action_times=1458346 Epoche=532\n",
      "Epsilon=0.865530 Action_times=1459841 Epoche=533\n",
      "Epsilon=0.865467 Action_times=1460580 Epoche=534\n",
      "Epsilon=0.865185 Action_times=1463869 Epoche=535\n",
      "Epsilon=0.865147 Action_times=1464314 Epoche=536\n",
      "Epsilon=0.864838 Action_times=1467924 Epoche=537\n",
      "Epsilon=0.864520 Action_times=1471653 Epoche=538\n",
      "Epsilon=0.864360 Action_times=1473527 Epoche=539\n",
      "Epsilon=0.864260 Action_times=1474692 Epoche=540\n",
      "Epsilon=0.864137 Action_times=1476131 Epoche=541\n",
      "Epsilon=0.863899 Action_times=1478917 Epoche=542\n",
      "Epsilon=0.863820 Action_times=1479847 Epoche=543\n",
      "Epsilon=0.863651 Action_times=1481823 Epoche=544\n",
      "Epsilon=0.863542 Action_times=1483105 Epoche=545\n",
      "Epsilon=0.863423 Action_times=1484500 Epoche=546\n",
      "Epsilon=0.863327 Action_times=1485625 Epoche=547\n",
      "Epsilon=0.863181 Action_times=1487337 Epoche=548\n",
      "Epsilon=0.863073 Action_times=1488595 Epoche=549\n",
      "Epsilon=0.862994 Action_times=1489519 Epoche=550\n",
      "Epsilon=0.862843 Action_times=1491296 Epoche=551\n",
      "Epsilon=0.862735 Action_times=1492563 Epoche=552\n",
      "Epsilon=0.862691 Action_times=1493074 Epoche=553\n",
      "Epsilon=0.862678 Action_times=1493229 Epoche=554\n",
      "Epsilon=0.862612 Action_times=1494004 Epoche=555\n",
      "Epsilon=0.862438 Action_times=1496043 Epoche=556\n",
      "Epsilon=0.862332 Action_times=1497293 Epoche=557\n",
      "Epsilon=0.862288 Action_times=1497803 Epoche=558\n",
      "Epsilon=0.862185 Action_times=1499015 Epoche=559\n",
      "Epsilon=0.861962 Action_times=1501628 Epoche=560\n",
      "Epsilon=0.861758 Action_times=1504027 Epoche=561\n",
      "Epsilon=0.861525 Action_times=1506762 Epoche=562\n",
      "Epsilon=0.861402 Action_times=1508211 Epoche=563\n",
      "Epsilon=0.861202 Action_times=1510552 Epoche=564\n",
      "Epsilon=0.861003 Action_times=1512898 Epoche=565\n",
      "Epsilon=0.860937 Action_times=1513670 Epoche=566\n",
      "Epsilon=0.860872 Action_times=1514429 Epoche=567\n",
      "Epsilon=0.860843 Action_times=1514774 Epoche=568\n",
      "Epsilon=0.860602 Action_times=1517607 Epoche=569\n",
      "Epsilon=0.860407 Action_times=1519899 Epoche=570\n",
      "Epsilon=0.860153 Action_times=1522885 Epoche=571\n",
      "Epsilon=0.860051 Action_times=1524090 Epoche=572\n",
      "Epsilon=0.859867 Action_times=1526251 Epoche=573\n",
      "Epsilon=0.859839 Action_times=1526575 Epoche=574\n",
      "Epsilon=0.859733 Action_times=1527823 Epoche=575\n",
      "Epsilon=0.859700 Action_times=1528218 Epoche=576\n",
      "Epsilon=0.859518 Action_times=1530358 Epoche=577\n",
      "Epsilon=0.859435 Action_times=1531338 Epoche=578\n",
      "Epsilon=0.859306 Action_times=1532857 Epoche=579\n",
      "Epsilon=0.859157 Action_times=1534609 Epoche=580\n",
      "Epsilon=0.858841 Action_times=1538328 Epoche=581\n",
      "Epsilon=0.858788 Action_times=1538952 Epoche=582\n",
      "Epsilon=0.858676 Action_times=1540277 Epoche=583\n",
      "Epsilon=0.858605 Action_times=1541112 Epoche=584\n",
      "Epsilon=0.858497 Action_times=1542383 Epoche=585\n",
      "Epsilon=0.858399 Action_times=1543535 Epoche=586\n",
      "Epsilon=0.858294 Action_times=1544773 Epoche=587\n",
      "Epsilon=0.858068 Action_times=1547441 Epoche=588\n",
      "Epsilon=0.857854 Action_times=1549967 Epoche=589\n",
      "Epsilon=0.857720 Action_times=1551541 Epoche=590\n",
      "Epsilon=0.857643 Action_times=1552456 Epoche=591\n",
      "Epsilon=0.857599 Action_times=1552977 Epoche=592\n",
      "Epsilon=0.857537 Action_times=1553700 Epoche=593\n",
      "Epsilon=0.857404 Action_times=1555277 Epoche=594\n",
      "Epsilon=0.857267 Action_times=1556896 Epoche=595\n",
      "Epsilon=0.857256 Action_times=1557020 Epoche=596\n",
      "Epsilon=0.857228 Action_times=1557356 Epoche=597\n",
      "Epsilon=0.857020 Action_times=1559811 Epoche=598\n",
      "Epsilon=0.856819 Action_times=1562185 Epoche=599\n",
      "Epsilon=0.856743 Action_times=1563072 Epoche=600\n",
      "Epsilon=0.856643 Action_times=1564260 Epoche=601\n",
      "Epsilon=0.856236 Action_times=1569066 Epoche=602\n",
      "Epsilon=0.856096 Action_times=1570718 Epoche=603\n",
      "Epsilon=0.855977 Action_times=1572132 Epoche=604\n",
      "Epsilon=0.855717 Action_times=1575204 Epoche=605\n",
      "Epsilon=0.855634 Action_times=1576179 Epoche=606\n",
      "Epsilon=0.855422 Action_times=1578696 Epoche=607\n",
      "Epsilon=0.855391 Action_times=1579056 Epoche=608\n",
      "Epsilon=0.855332 Action_times=1579754 Epoche=609\n",
      "Epsilon=0.855275 Action_times=1580430 Epoche=610\n",
      "Epsilon=0.855253 Action_times=1580689 Epoche=611\n",
      "Epsilon=0.855075 Action_times=1582796 Epoche=612\n",
      "Epsilon=0.854960 Action_times=1584157 Epoche=613\n",
      "Epsilon=0.854729 Action_times=1586893 Epoche=614\n",
      "Epsilon=0.854583 Action_times=1588615 Epoche=615\n",
      "Epsilon=0.854395 Action_times=1590847 Epoche=616\n",
      "Epsilon=0.854260 Action_times=1592440 Epoche=617\n",
      "Epsilon=0.854144 Action_times=1593815 Epoche=618\n",
      "Epsilon=0.854010 Action_times=1595408 Epoche=619\n",
      "Epsilon=0.853919 Action_times=1596489 Epoche=620\n",
      "Epsilon=0.853747 Action_times=1598520 Epoche=621\n",
      "Epsilon=0.853543 Action_times=1600937 Epoche=622\n",
      "Epsilon=0.853465 Action_times=1601868 Epoche=623\n",
      "Epsilon=0.853223 Action_times=1604738 Epoche=624\n",
      "Epsilon=0.853196 Action_times=1605050 Epoche=625\n",
      "Epsilon=0.853038 Action_times=1606928 Epoche=626\n",
      "Epsilon=0.852938 Action_times=1608115 Epoche=627\n",
      "Epsilon=0.852735 Action_times=1610518 Epoche=628\n",
      "Epsilon=0.852687 Action_times=1611090 Epoche=629\n",
      "Epsilon=0.852604 Action_times=1612082 Epoche=630\n",
      "Epsilon=0.852493 Action_times=1613394 Epoche=631\n",
      "Epsilon=0.852428 Action_times=1614164 Epoche=632\n",
      "Epsilon=0.852278 Action_times=1615943 Epoche=633\n",
      "Epsilon=0.852071 Action_times=1618404 Epoche=634\n",
      "Epsilon=0.851983 Action_times=1619455 Epoche=635\n",
      "Epsilon=0.851941 Action_times=1619946 Epoche=636\n",
      "Epsilon=0.851884 Action_times=1620631 Epoche=637\n",
      "Epsilon=0.851840 Action_times=1621151 Epoche=638\n",
      "Epsilon=0.851744 Action_times=1622286 Epoche=639\n",
      "Epsilon=0.851601 Action_times=1623987 Epoche=640\n",
      "Epsilon=0.851542 Action_times=1624689 Epoche=641\n",
      "Epsilon=0.851478 Action_times=1625447 Epoche=642\n",
      "Epsilon=0.851422 Action_times=1626114 Epoche=643\n",
      "Epsilon=0.851384 Action_times=1626569 Epoche=644\n",
      "Epsilon=0.851312 Action_times=1627425 Epoche=645\n",
      "Epsilon=0.851083 Action_times=1630149 Epoche=646\n",
      "Epsilon=0.850860 Action_times=1632794 Epoche=647\n",
      "Epsilon=0.850710 Action_times=1634584 Epoche=648\n",
      "Epsilon=0.850622 Action_times=1635628 Epoche=649\n",
      "Epsilon=0.850536 Action_times=1636648 Epoche=650\n",
      "Epsilon=0.850383 Action_times=1638472 Epoche=651\n",
      "Epsilon=0.850378 Action_times=1638530 Epoche=652\n",
      "Epsilon=0.850332 Action_times=1639081 Epoche=653\n",
      "Epsilon=0.850239 Action_times=1640183 Epoche=654\n",
      "Epsilon=0.850124 Action_times=1641559 Epoche=655\n",
      "Epsilon=0.849849 Action_times=1644833 Epoche=656\n",
      "Epsilon=0.849627 Action_times=1647468 Epoche=657\n",
      "Epsilon=0.849480 Action_times=1649219 Epoche=658\n",
      "Epsilon=0.849087 Action_times=1653906 Epoche=659\n",
      "Epsilon=0.848943 Action_times=1655624 Epoche=660\n",
      "Epsilon=0.848826 Action_times=1657019 Epoche=661\n",
      "Epsilon=0.848687 Action_times=1658677 Epoche=662\n",
      "Epsilon=0.848508 Action_times=1660812 Epoche=663\n",
      "Epsilon=0.848340 Action_times=1662813 Epoche=664\n",
      "Epsilon=0.848180 Action_times=1664720 Epoche=665\n",
      "Epsilon=0.848058 Action_times=1666171 Epoche=666\n",
      "Epsilon=0.847963 Action_times=1667313 Epoche=667\n",
      "Epsilon=0.847935 Action_times=1667641 Epoche=668\n",
      "Epsilon=0.847881 Action_times=1668290 Epoche=669\n",
      "Epsilon=0.847747 Action_times=1669888 Epoche=670\n",
      "Epsilon=0.847544 Action_times=1672313 Epoche=671\n",
      "Epsilon=0.847448 Action_times=1673461 Epoche=672\n",
      "Epsilon=0.847444 Action_times=1673502 Epoche=673\n",
      "Epsilon=0.847290 Action_times=1675350 Epoche=674\n",
      "Epsilon=0.847206 Action_times=1676352 Epoche=675\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.847112 Action_times=1677471 Epoche=676\n",
      "Epsilon=0.846999 Action_times=1678819 Epoche=677\n",
      "Epsilon=0.846983 Action_times=1679013 Epoche=678\n",
      "Epsilon=0.846932 Action_times=1679622 Epoche=679\n",
      "Epsilon=0.846890 Action_times=1680122 Epoche=680\n",
      "Epsilon=0.846841 Action_times=1680708 Epoche=681\n",
      "Epsilon=0.846771 Action_times=1681543 Epoche=682\n",
      "Epsilon=0.846702 Action_times=1682367 Epoche=683\n",
      "Epsilon=0.846594 Action_times=1683661 Epoche=684\n",
      "Epsilon=0.846590 Action_times=1683704 Epoche=685\n",
      "Epsilon=0.846519 Action_times=1684559 Epoche=686\n",
      "Epsilon=0.846441 Action_times=1685487 Epoche=687\n",
      "Epsilon=0.846274 Action_times=1687491 Epoche=688\n",
      "Epsilon=0.846141 Action_times=1689073 Epoche=689\n",
      "Epsilon=0.845998 Action_times=1690789 Epoche=690\n",
      "Epsilon=0.845843 Action_times=1692638 Epoche=691\n",
      "Epsilon=0.845804 Action_times=1693106 Epoche=692\n",
      "Epsilon=0.845711 Action_times=1694225 Epoche=693\n",
      "Epsilon=0.845659 Action_times=1694840 Epoche=694\n",
      "Epsilon=0.845475 Action_times=1697045 Epoche=695\n",
      "Epsilon=0.845406 Action_times=1697870 Epoche=696\n",
      "Epsilon=0.845167 Action_times=1700727 Epoche=697\n",
      "Epsilon=0.845045 Action_times=1702192 Epoche=698\n",
      "Epsilon=0.844823 Action_times=1704858 Epoche=699\n",
      "Epsilon=0.844651 Action_times=1706911 Epoche=700\n",
      "Epsilon=0.844546 Action_times=1708171 Epoche=701\n",
      "Epsilon=0.844286 Action_times=1711286 Epoche=702\n",
      "Epsilon=0.844102 Action_times=1713495 Epoche=703\n",
      "Epsilon=0.844043 Action_times=1714199 Epoche=704\n",
      "Epsilon=0.843903 Action_times=1715881 Epoche=705\n",
      "Epsilon=0.843647 Action_times=1718949 Epoche=706\n",
      "Epsilon=0.843492 Action_times=1720805 Epoche=707\n",
      "Epsilon=0.843355 Action_times=1722453 Epoche=708\n",
      "Epsilon=0.843016 Action_times=1726515 Epoche=709\n",
      "Epsilon=0.842858 Action_times=1728422 Epoche=710\n",
      "Epsilon=0.842661 Action_times=1730784 Epoche=711\n",
      "Epsilon=0.842622 Action_times=1731257 Epoche=712\n",
      "Epsilon=0.842481 Action_times=1732951 Epoche=713\n",
      "Epsilon=0.842429 Action_times=1733574 Epoche=714\n",
      "Epsilon=0.842369 Action_times=1734292 Epoche=715\n",
      "Epsilon=0.842175 Action_times=1736626 Epoche=716\n",
      "Epsilon=0.842101 Action_times=1737514 Epoche=717\n",
      "Epsilon=0.841899 Action_times=1739944 Epoche=718\n",
      "Epsilon=0.841873 Action_times=1740249 Epoche=719\n",
      "Epsilon=0.841696 Action_times=1742381 Epoche=720\n",
      "Epsilon=0.841556 Action_times=1744068 Epoche=721\n",
      "Epsilon=0.841534 Action_times=1744332 Epoche=722\n",
      "Epsilon=0.841364 Action_times=1746375 Epoche=723\n",
      "Epsilon=0.841339 Action_times=1746671 Epoche=724\n",
      "Epsilon=0.841179 Action_times=1748594 Epoche=725\n",
      "Epsilon=0.840967 Action_times=1751147 Epoche=726\n",
      "Epsilon=0.840892 Action_times=1752057 Epoche=727\n",
      "Epsilon=0.840831 Action_times=1752781 Epoche=728\n",
      "Epsilon=0.840648 Action_times=1754990 Epoche=729\n",
      "Epsilon=0.840502 Action_times=1756748 Epoche=730\n",
      "Epsilon=0.840416 Action_times=1757777 Epoche=731\n",
      "Epsilon=0.840170 Action_times=1760750 Epoche=732\n",
      "Epsilon=0.840067 Action_times=1761982 Epoche=733\n",
      "Epsilon=0.839991 Action_times=1762902 Epoche=734\n",
      "Epsilon=0.839914 Action_times=1763826 Epoche=735\n",
      "Epsilon=0.839768 Action_times=1765587 Epoche=736\n",
      "Epsilon=0.839645 Action_times=1767066 Epoche=737\n",
      "Epsilon=0.839549 Action_times=1768229 Epoche=738\n",
      "Epsilon=0.839155 Action_times=1772978 Epoche=739\n",
      "Epsilon=0.838950 Action_times=1775454 Epoche=740\n",
      "Epsilon=0.838774 Action_times=1777569 Epoche=741\n",
      "Epsilon=0.838582 Action_times=1779897 Epoche=742\n",
      "Epsilon=0.838483 Action_times=1781087 Epoche=743\n",
      "Epsilon=0.838397 Action_times=1782129 Epoche=744\n",
      "Epsilon=0.838268 Action_times=1783682 Epoche=745\n",
      "Epsilon=0.838145 Action_times=1785165 Epoche=746\n",
      "Epsilon=0.838055 Action_times=1786258 Epoche=747\n",
      "Epsilon=0.837838 Action_times=1788870 Epoche=748\n",
      "Epsilon=0.837676 Action_times=1790833 Epoche=749\n",
      "Epsilon=0.837654 Action_times=1791093 Epoche=750\n",
      "Epsilon=0.837585 Action_times=1791936 Epoche=751\n",
      "Epsilon=0.837420 Action_times=1793923 Epoche=752\n",
      "Epsilon=0.837277 Action_times=1795659 Epoche=753\n",
      "Epsilon=0.837239 Action_times=1796115 Epoche=754\n",
      "Epsilon=0.837129 Action_times=1797442 Epoche=755\n",
      "Epsilon=0.836928 Action_times=1799874 Epoche=756\n",
      "Epsilon=0.836741 Action_times=1802129 Epoche=757\n",
      "Epsilon=0.836719 Action_times=1802395 Epoche=758\n",
      "Epsilon=0.836558 Action_times=1804345 Epoche=759\n",
      "Epsilon=0.836445 Action_times=1805716 Epoche=760\n",
      "Epsilon=0.836293 Action_times=1807561 Epoche=761\n",
      "Epsilon=0.836200 Action_times=1808684 Epoche=762\n",
      "Epsilon=0.835989 Action_times=1811238 Epoche=763\n",
      "Epsilon=0.835836 Action_times=1813087 Epoche=764\n",
      "Epsilon=0.835782 Action_times=1813745 Epoche=765\n",
      "Epsilon=0.835711 Action_times=1814596 Epoche=766\n",
      "Epsilon=0.835690 Action_times=1814856 Epoche=767\n",
      "Epsilon=0.835576 Action_times=1816242 Epoche=768\n",
      "Epsilon=0.835312 Action_times=1819438 Epoche=769\n",
      "Epsilon=0.835108 Action_times=1821907 Epoche=770\n",
      "Epsilon=0.834925 Action_times=1824121 Epoche=771\n",
      "Epsilon=0.834849 Action_times=1825049 Epoche=772\n",
      "Epsilon=0.834550 Action_times=1828675 Epoche=773\n",
      "Epsilon=0.834452 Action_times=1829860 Epoche=774\n",
      "Epsilon=0.834360 Action_times=1830979 Epoche=775\n",
      "Epsilon=0.834225 Action_times=1832608 Epoche=776\n",
      "Epsilon=0.834208 Action_times=1832821 Epoche=777\n",
      "Epsilon=0.834191 Action_times=1833029 Epoche=778\n",
      "Epsilon=0.834115 Action_times=1833951 Epoche=779\n",
      "Epsilon=0.834049 Action_times=1834752 Epoche=780\n",
      "Epsilon=0.833997 Action_times=1835376 Epoche=781\n",
      "Epsilon=0.833947 Action_times=1835985 Epoche=782\n",
      "Epsilon=0.833720 Action_times=1838743 Epoche=783\n",
      "Epsilon=0.833692 Action_times=1839079 Epoche=784\n",
      "Epsilon=0.833637 Action_times=1839750 Epoche=785\n",
      "Epsilon=0.833603 Action_times=1840164 Epoche=786\n",
      "Epsilon=0.833503 Action_times=1841382 Epoche=787\n",
      "Epsilon=0.833387 Action_times=1842786 Epoche=788\n",
      "Epsilon=0.833355 Action_times=1843173 Epoche=789\n",
      "Epsilon=0.833333 Action_times=1843445 Epoche=790\n",
      "Epsilon=0.833302 Action_times=1843818 Epoche=791\n",
      "Epsilon=0.833265 Action_times=1844270 Epoche=792\n",
      "Epsilon=0.833194 Action_times=1845128 Epoche=793\n",
      "Epsilon=0.833063 Action_times=1846727 Epoche=794\n",
      "Epsilon=0.833007 Action_times=1847398 Epoche=795\n",
      "Epsilon=0.832880 Action_times=1848944 Epoche=796\n",
      "Epsilon=0.832839 Action_times=1849445 Epoche=797\n",
      "Epsilon=0.832446 Action_times=1854219 Epoche=798\n",
      "Epsilon=0.832294 Action_times=1856075 Epoche=799\n",
      "Epsilon=0.832219 Action_times=1856985 Epoche=800\n",
      "Epsilon=0.832147 Action_times=1857860 Epoche=801\n",
      "Epsilon=0.831991 Action_times=1859750 Epoche=802\n",
      "Epsilon=0.831882 Action_times=1861082 Epoche=803\n",
      "Epsilon=0.831735 Action_times=1862864 Epoche=804\n",
      "Epsilon=0.831570 Action_times=1864883 Epoche=805\n",
      "Epsilon=0.831440 Action_times=1866466 Epoche=806\n",
      "Epsilon=0.831364 Action_times=1867389 Epoche=807\n",
      "Epsilon=0.831285 Action_times=1868351 Epoche=808\n",
      "Epsilon=0.831069 Action_times=1870977 Epoche=809\n",
      "Epsilon=0.831026 Action_times=1871500 Epoche=810\n",
      "Epsilon=0.830841 Action_times=1873750 Epoche=811\n",
      "Epsilon=0.830673 Action_times=1875800 Epoche=812\n",
      "Epsilon=0.830484 Action_times=1878105 Epoche=813\n",
      "Epsilon=0.830347 Action_times=1879778 Epoche=814\n",
      "Epsilon=0.830257 Action_times=1880873 Epoche=815\n",
      "Epsilon=0.830182 Action_times=1881787 Epoche=816\n",
      "Epsilon=0.830104 Action_times=1882736 Epoche=817\n",
      "Epsilon=0.830050 Action_times=1883402 Epoche=818\n",
      "Epsilon=0.829920 Action_times=1884987 Epoche=819\n",
      "Epsilon=0.829876 Action_times=1885518 Epoche=820\n",
      "Epsilon=0.829814 Action_times=1886271 Epoche=821\n",
      "Epsilon=0.829728 Action_times=1887318 Epoche=822\n",
      "Epsilon=0.829390 Action_times=1891446 Epoche=823\n",
      "Epsilon=0.829291 Action_times=1892659 Epoche=824\n",
      "Epsilon=0.829258 Action_times=1893063 Epoche=825\n",
      "Epsilon=0.829169 Action_times=1894149 Epoche=826\n",
      "Epsilon=0.828949 Action_times=1896833 Epoche=827\n",
      "Epsilon=0.828665 Action_times=1900296 Epoche=828\n",
      "Epsilon=0.828637 Action_times=1900641 Epoche=829\n",
      "Epsilon=0.828491 Action_times=1902421 Epoche=830\n",
      "Epsilon=0.828358 Action_times=1904049 Epoche=831\n",
      "Epsilon=0.828282 Action_times=1904977 Epoche=832\n",
      "Epsilon=0.828236 Action_times=1905543 Epoche=833\n",
      "Epsilon=0.828183 Action_times=1906191 Epoche=834\n",
      "Epsilon=0.828081 Action_times=1907438 Epoche=835\n",
      "Epsilon=0.827823 Action_times=1910594 Epoche=836\n",
      "Epsilon=0.827716 Action_times=1911896 Epoche=837\n",
      "Epsilon=0.827694 Action_times=1912171 Epoche=838\n",
      "Epsilon=0.827591 Action_times=1913432 Epoche=839\n",
      "Epsilon=0.827562 Action_times=1913785 Epoche=840\n",
      "Epsilon=0.827481 Action_times=1914774 Epoche=841\n",
      "Epsilon=0.827450 Action_times=1915149 Epoche=842\n",
      "Epsilon=0.827418 Action_times=1915546 Epoche=843\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.827306 Action_times=1916911 Epoche=844\n",
      "Epsilon=0.826977 Action_times=1920940 Epoche=845\n",
      "Epsilon=0.826974 Action_times=1920978 Epoche=846\n",
      "Epsilon=0.826854 Action_times=1922441 Epoche=847\n",
      "Epsilon=0.826608 Action_times=1925452 Epoche=848\n",
      "Epsilon=0.826569 Action_times=1925934 Epoche=849\n",
      "Epsilon=0.826505 Action_times=1926718 Epoche=850\n",
      "Epsilon=0.826395 Action_times=1928068 Epoche=851\n",
      "Epsilon=0.826252 Action_times=1929815 Epoche=852\n",
      "Epsilon=0.826129 Action_times=1931326 Epoche=853\n",
      "Epsilon=0.825996 Action_times=1932949 Epoche=854\n",
      "Epsilon=0.825890 Action_times=1934248 Epoche=855\n",
      "Epsilon=0.825772 Action_times=1935695 Epoche=856\n",
      "Epsilon=0.825681 Action_times=1936812 Epoche=857\n",
      "Epsilon=0.825560 Action_times=1938302 Epoche=858\n",
      "Epsilon=0.825355 Action_times=1940816 Epoche=859\n",
      "Epsilon=0.825286 Action_times=1941658 Epoche=860\n",
      "Epsilon=0.825161 Action_times=1943192 Epoche=861\n",
      "Epsilon=0.824920 Action_times=1946154 Epoche=862\n",
      "Epsilon=0.824674 Action_times=1949175 Epoche=863\n",
      "Epsilon=0.824610 Action_times=1949951 Epoche=864\n",
      "Epsilon=0.824350 Action_times=1953153 Epoche=865\n",
      "Epsilon=0.824318 Action_times=1953540 Epoche=866\n",
      "Epsilon=0.824203 Action_times=1954958 Epoche=867\n",
      "Epsilon=0.823872 Action_times=1959023 Epoche=868\n",
      "Epsilon=0.823822 Action_times=1959629 Epoche=869\n",
      "Epsilon=0.823619 Action_times=1962127 Epoche=870\n",
      "Epsilon=0.823456 Action_times=1964130 Epoche=871\n",
      "Epsilon=0.823442 Action_times=1964308 Epoche=872\n",
      "Epsilon=0.823334 Action_times=1965637 Epoche=873\n",
      "Epsilon=0.823282 Action_times=1966268 Epoche=874\n",
      "Epsilon=0.823088 Action_times=1968654 Epoche=875\n",
      "Epsilon=0.822997 Action_times=1969776 Epoche=876\n",
      "Epsilon=0.822824 Action_times=1971905 Epoche=877\n",
      "Epsilon=0.822638 Action_times=1974187 Epoche=878\n",
      "Epsilon=0.822582 Action_times=1974883 Epoche=879\n",
      "Epsilon=0.822449 Action_times=1976514 Epoche=880\n",
      "Epsilon=0.822295 Action_times=1978417 Epoche=881\n",
      "Epsilon=0.822214 Action_times=1979416 Epoche=882\n",
      "Epsilon=0.822093 Action_times=1980896 Epoche=883\n",
      "Epsilon=0.821741 Action_times=1985240 Epoche=884\n",
      "Epsilon=0.821451 Action_times=1988810 Epoche=885\n",
      "Epsilon=0.821126 Action_times=1992821 Epoche=886\n",
      "Epsilon=0.820846 Action_times=1996269 Epoche=887\n",
      "Epsilon=0.820787 Action_times=1996991 Epoche=888\n",
      "Epsilon=0.820540 Action_times=2000041 Epoche=889\n",
      "Epsilon=0.820442 Action_times=2001249 Epoche=890\n",
      "Epsilon=0.820398 Action_times=2001800 Epoche=891\n",
      "Epsilon=0.820258 Action_times=2003525 Epoche=892\n",
      "Epsilon=0.820156 Action_times=2004778 Epoche=893\n",
      "Epsilon=0.820058 Action_times=2005988 Epoche=894\n",
      "Epsilon=0.819885 Action_times=2008125 Epoche=895\n",
      "Epsilon=0.819806 Action_times=2009106 Epoche=896\n",
      "Epsilon=0.819689 Action_times=2010545 Epoche=897\n",
      "Epsilon=0.819606 Action_times=2011567 Epoche=898\n",
      "Epsilon=0.819509 Action_times=2012768 Epoche=899\n",
      "Epsilon=0.819418 Action_times=2013900 Epoche=900\n",
      "Epsilon=0.819325 Action_times=2015043 Epoche=901\n",
      "Epsilon=0.819193 Action_times=2016673 Epoche=902\n",
      "Epsilon=0.819046 Action_times=2018489 Epoche=903\n",
      "Epsilon=0.819016 Action_times=2018865 Epoche=904\n",
      "Epsilon=0.818920 Action_times=2020046 Epoche=905\n",
      "Epsilon=0.818913 Action_times=2020133 Epoche=906\n",
      "Epsilon=0.818870 Action_times=2020667 Epoche=907\n",
      "Epsilon=0.818861 Action_times=2020782 Epoche=908\n",
      "Epsilon=0.818741 Action_times=2022260 Epoche=909\n",
      "Epsilon=0.818428 Action_times=2026137 Epoche=910\n",
      "Epsilon=0.818194 Action_times=2029031 Epoche=911\n",
      "Epsilon=0.818064 Action_times=2030636 Epoche=912\n",
      "Epsilon=0.817951 Action_times=2032030 Epoche=913\n",
      "Epsilon=0.817951 Action_times=2032038 Epoche=914\n",
      "Epsilon=0.817751 Action_times=2034506 Epoche=915\n",
      "Epsilon=0.817591 Action_times=2036494 Epoche=916\n",
      "Epsilon=0.817496 Action_times=2037674 Epoche=917\n",
      "Epsilon=0.817385 Action_times=2039048 Epoche=918\n",
      "Epsilon=0.817240 Action_times=2040842 Epoche=919\n",
      "Epsilon=0.817088 Action_times=2042724 Epoche=920\n",
      "Epsilon=0.817030 Action_times=2043437 Epoche=921\n",
      "Epsilon=0.816930 Action_times=2044677 Epoche=922\n",
      "Epsilon=0.816785 Action_times=2046482 Epoche=923\n",
      "Epsilon=0.816646 Action_times=2048205 Epoche=924\n",
      "Epsilon=0.816580 Action_times=2049018 Epoche=925\n",
      "Epsilon=0.816489 Action_times=2050150 Epoche=926\n",
      "Epsilon=0.816404 Action_times=2051206 Epoche=927\n",
      "Epsilon=0.816282 Action_times=2052712 Epoche=928\n",
      "Epsilon=0.816272 Action_times=2052832 Epoche=929\n",
      "Epsilon=0.816098 Action_times=2054998 Epoche=930\n",
      "Epsilon=0.816037 Action_times=2055748 Epoche=931\n",
      "Epsilon=0.815720 Action_times=2059686 Epoche=932\n",
      "Epsilon=0.815673 Action_times=2060265 Epoche=933\n",
      "Epsilon=0.815475 Action_times=2062731 Epoche=934\n",
      "Epsilon=0.815302 Action_times=2064879 Epoche=935\n",
      "Epsilon=0.815259 Action_times=2065410 Epoche=936\n",
      "Epsilon=0.815091 Action_times=2067501 Epoche=937\n",
      "Epsilon=0.815087 Action_times=2067551 Epoche=938\n",
      "Epsilon=0.814897 Action_times=2069912 Epoche=939\n",
      "Epsilon=0.814666 Action_times=2072771 Epoche=940\n",
      "Epsilon=0.814554 Action_times=2074170 Epoche=941\n",
      "Epsilon=0.814441 Action_times=2075572 Epoche=942\n",
      "Epsilon=0.814372 Action_times=2076435 Epoche=943\n",
      "Epsilon=0.814252 Action_times=2077917 Epoche=944\n",
      "Epsilon=0.814234 Action_times=2078151 Epoche=945\n",
      "Epsilon=0.814109 Action_times=2079704 Epoche=946\n",
      "Epsilon=0.813975 Action_times=2081373 Epoche=947\n",
      "Epsilon=0.813851 Action_times=2082910 Epoche=948\n",
      "Epsilon=0.813821 Action_times=2083282 Epoche=949\n",
      "Epsilon=0.813765 Action_times=2083985 Epoche=950\n",
      "Epsilon=0.813700 Action_times=2084786 Epoche=951\n",
      "Epsilon=0.813673 Action_times=2085127 Epoche=952\n",
      "Epsilon=0.813420 Action_times=2088273 Epoche=953\n",
      "Epsilon=0.813293 Action_times=2089859 Epoche=954\n",
      "Epsilon=0.813076 Action_times=2092557 Epoche=955\n",
      "Epsilon=0.812966 Action_times=2093922 Epoche=956\n",
      "Epsilon=0.812879 Action_times=2095014 Epoche=957\n",
      "Epsilon=0.812763 Action_times=2096456 Epoche=958\n",
      "Epsilon=0.812597 Action_times=2098525 Epoche=959\n",
      "Epsilon=0.812417 Action_times=2100767 Epoche=960\n",
      "Epsilon=0.812410 Action_times=2100848 Epoche=961\n",
      "Epsilon=0.812321 Action_times=2101959 Epoche=962\n",
      "Epsilon=0.812260 Action_times=2102726 Epoche=963\n",
      "Epsilon=0.812178 Action_times=2103740 Epoche=964\n",
      "Epsilon=0.812052 Action_times=2105311 Epoche=965\n",
      "Epsilon=0.811787 Action_times=2108624 Epoche=966\n",
      "Epsilon=0.811765 Action_times=2108893 Epoche=967\n",
      "Epsilon=0.811687 Action_times=2109873 Epoche=968\n",
      "Epsilon=0.811527 Action_times=2111869 Epoche=969\n",
      "Epsilon=0.811481 Action_times=2112437 Epoche=970\n",
      "Epsilon=0.811453 Action_times=2112789 Epoche=971\n",
      "Epsilon=0.811434 Action_times=2113026 Epoche=972\n",
      "Epsilon=0.811374 Action_times=2113770 Epoche=973\n",
      "Epsilon=0.811335 Action_times=2114262 Epoche=974\n",
      "Epsilon=0.811296 Action_times=2114744 Epoche=975\n",
      "Epsilon=0.811179 Action_times=2116200 Epoche=976\n",
      "Epsilon=0.811109 Action_times=2117075 Epoche=977\n",
      "Epsilon=0.811017 Action_times=2118232 Epoche=978\n",
      "Epsilon=0.810939 Action_times=2119207 Epoche=979\n",
      "Epsilon=0.810857 Action_times=2120223 Epoche=980\n",
      "Epsilon=0.810738 Action_times=2121712 Epoche=981\n",
      "Epsilon=0.810606 Action_times=2123358 Epoche=982\n",
      "Epsilon=0.810587 Action_times=2123598 Epoche=983\n",
      "Epsilon=0.810376 Action_times=2126232 Epoche=984\n",
      "Epsilon=0.810370 Action_times=2126309 Epoche=985\n",
      "Epsilon=0.810203 Action_times=2128401 Epoche=986\n",
      "Epsilon=0.810114 Action_times=2129511 Epoche=987\n",
      "Epsilon=0.810006 Action_times=2130855 Epoche=988\n",
      "Epsilon=0.809872 Action_times=2132529 Epoche=989\n",
      "Epsilon=0.809714 Action_times=2134506 Epoche=990\n",
      "Epsilon=0.809614 Action_times=2135759 Epoche=991\n",
      "Epsilon=0.809558 Action_times=2136455 Epoche=992\n",
      "Epsilon=0.809430 Action_times=2138057 Epoche=993\n",
      "Epsilon=0.809269 Action_times=2140080 Epoche=994\n",
      "Epsilon=0.809072 Action_times=2142545 Epoche=995\n",
      "Epsilon=0.808963 Action_times=2143904 Epoche=996\n",
      "Epsilon=0.808735 Action_times=2146763 Epoche=997\n",
      "Epsilon=0.808544 Action_times=2149148 Epoche=998\n",
      "Epsilon=0.808455 Action_times=2150260 Epoche=999\n",
      "Epsilon=0.808235 Action_times=2153018 Epoche=1000\n",
      "Epsilon=0.808111 Action_times=2154572 Epoche=1001\n",
      "Epsilon=0.807918 Action_times=2156995 Epoche=1002\n",
      "Epsilon=0.807696 Action_times=2159775 Epoche=1003\n",
      "Epsilon=0.807605 Action_times=2160912 Epoche=1004\n",
      "Epsilon=0.807487 Action_times=2162393 Epoche=1005\n",
      "Epsilon=0.807363 Action_times=2163950 Epoche=1006\n",
      "Epsilon=0.807094 Action_times=2167328 Epoche=1007\n",
      "Epsilon=0.807034 Action_times=2168077 Epoche=1008\n",
      "Epsilon=0.806804 Action_times=2170957 Epoche=1009\n",
      "Epsilon=0.806649 Action_times=2172908 Epoche=1010\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.806496 Action_times=2174833 Epoche=1011\n",
      "Epsilon=0.806361 Action_times=2176524 Epoche=1012\n",
      "Epsilon=0.806238 Action_times=2178073 Epoche=1013\n",
      "Epsilon=0.806109 Action_times=2179683 Epoche=1014\n",
      "Epsilon=0.805965 Action_times=2181500 Epoche=1015\n",
      "Epsilon=0.805732 Action_times=2184426 Epoche=1016\n",
      "Epsilon=0.805542 Action_times=2186815 Epoche=1017\n",
      "Epsilon=0.805507 Action_times=2187258 Epoche=1018\n",
      "Epsilon=0.805457 Action_times=2187878 Epoche=1019\n",
      "Epsilon=0.805318 Action_times=2189631 Epoche=1020\n",
      "Epsilon=0.805260 Action_times=2190363 Epoche=1021\n",
      "Epsilon=0.805123 Action_times=2192085 Epoche=1022\n",
      "Epsilon=0.805022 Action_times=2193352 Epoche=1023\n",
      "Epsilon=0.804973 Action_times=2193972 Epoche=1024\n",
      "Epsilon=0.804894 Action_times=2194963 Epoche=1025\n",
      "Epsilon=0.804840 Action_times=2195644 Epoche=1026\n",
      "Epsilon=0.804697 Action_times=2197445 Epoche=1027\n",
      "Epsilon=0.804500 Action_times=2199922 Epoche=1028\n",
      "Epsilon=0.804276 Action_times=2202745 Epoche=1029\n",
      "Epsilon=0.804242 Action_times=2203165 Epoche=1030\n",
      "Epsilon=0.804068 Action_times=2205364 Epoche=1031\n",
      "Epsilon=0.803953 Action_times=2206808 Epoche=1032\n",
      "Epsilon=0.803864 Action_times=2207933 Epoche=1033\n",
      "Epsilon=0.803837 Action_times=2208272 Epoche=1034\n",
      "Epsilon=0.803701 Action_times=2209976 Epoche=1035\n",
      "Epsilon=0.803682 Action_times=2210219 Epoche=1036\n",
      "Epsilon=0.803572 Action_times=2211605 Epoche=1037\n",
      "Epsilon=0.803334 Action_times=2214610 Epoche=1038\n",
      "Epsilon=0.803125 Action_times=2217242 Epoche=1039\n",
      "Epsilon=0.802815 Action_times=2221149 Epoche=1040\n",
      "Epsilon=0.802800 Action_times=2221338 Epoche=1041\n",
      "Epsilon=0.802697 Action_times=2222636 Epoche=1042\n",
      "Epsilon=0.802371 Action_times=2226746 Epoche=1043\n",
      "Epsilon=0.802263 Action_times=2228117 Epoche=1044\n",
      "Epsilon=0.802003 Action_times=2231392 Epoche=1045\n",
      "Epsilon=0.801952 Action_times=2232045 Epoche=1046\n",
      "Epsilon=0.801734 Action_times=2234793 Epoche=1047\n",
      "Epsilon=0.801540 Action_times=2237251 Epoche=1048\n",
      "Epsilon=0.801403 Action_times=2238978 Epoche=1049\n",
      "Epsilon=0.801297 Action_times=2240311 Epoche=1050\n",
      "Epsilon=0.801237 Action_times=2241079 Epoche=1051\n",
      "Epsilon=0.801040 Action_times=2243569 Epoche=1052\n",
      "Epsilon=0.800890 Action_times=2245455 Epoche=1053\n",
      "Epsilon=0.800748 Action_times=2247252 Epoche=1054\n",
      "Epsilon=0.800600 Action_times=2249130 Epoche=1055\n",
      "Epsilon=0.800356 Action_times=2252217 Epoche=1056\n",
      "Epsilon=0.800306 Action_times=2252843 Epoche=1057\n",
      "Epsilon=0.799985 Action_times=2256907 Epoche=1058\n",
      "Epsilon=0.799744 Action_times=2259964 Epoche=1059\n",
      "Epsilon=0.799654 Action_times=2261106 Epoche=1060\n",
      "Epsilon=0.799548 Action_times=2262448 Epoche=1061\n",
      "Epsilon=0.799436 Action_times=2263867 Epoche=1062\n",
      "Epsilon=0.799418 Action_times=2264091 Epoche=1063\n",
      "Epsilon=0.799222 Action_times=2266569 Epoche=1064\n",
      "Epsilon=0.799160 Action_times=2267364 Epoche=1065\n",
      "Epsilon=0.799109 Action_times=2268005 Epoche=1066\n",
      "Epsilon=0.798986 Action_times=2269562 Epoche=1067\n",
      "Epsilon=0.798913 Action_times=2270485 Epoche=1068\n",
      "Epsilon=0.798773 Action_times=2272259 Epoche=1069\n",
      "Epsilon=0.798668 Action_times=2273601 Epoche=1070\n",
      "Epsilon=0.798492 Action_times=2275822 Epoche=1071\n",
      "Epsilon=0.798346 Action_times=2277678 Epoche=1072\n",
      "Epsilon=0.798339 Action_times=2277764 Epoche=1073\n",
      "Epsilon=0.798193 Action_times=2279614 Epoche=1074\n",
      "Epsilon=0.797994 Action_times=2282141 Epoche=1075\n",
      "Epsilon=0.797854 Action_times=2283918 Epoche=1076\n",
      "Epsilon=0.797797 Action_times=2284648 Epoche=1077\n",
      "Epsilon=0.797714 Action_times=2285695 Epoche=1078\n",
      "Epsilon=0.797555 Action_times=2287713 Epoche=1079\n",
      "Epsilon=0.797377 Action_times=2289979 Epoche=1080\n",
      "Epsilon=0.797264 Action_times=2291408 Epoche=1081\n",
      "Epsilon=0.797091 Action_times=2293617 Epoche=1082\n",
      "Epsilon=0.796959 Action_times=2295294 Epoche=1083\n",
      "Epsilon=0.796896 Action_times=2296092 Epoche=1084\n",
      "Epsilon=0.796888 Action_times=2296189 Epoche=1085\n",
      "Epsilon=0.796693 Action_times=2298672 Epoche=1086\n",
      "Epsilon=0.796633 Action_times=2299434 Epoche=1087\n",
      "Epsilon=0.796417 Action_times=2302180 Epoche=1088\n",
      "Epsilon=0.796216 Action_times=2304729 Epoche=1089\n",
      "Epsilon=0.796034 Action_times=2307047 Epoche=1090\n",
      "Epsilon=0.795877 Action_times=2309048 Epoche=1091\n",
      "Epsilon=0.795801 Action_times=2310008 Epoche=1092\n",
      "Epsilon=0.795698 Action_times=2311326 Epoche=1093\n",
      "Epsilon=0.795622 Action_times=2312292 Epoche=1094\n",
      "Epsilon=0.795491 Action_times=2313964 Epoche=1095\n",
      "Epsilon=0.795407 Action_times=2315024 Epoche=1096\n",
      "Epsilon=0.795302 Action_times=2316362 Epoche=1097\n",
      "Epsilon=0.795203 Action_times=2317621 Epoche=1098\n",
      "Epsilon=0.795004 Action_times=2320158 Epoche=1099\n",
      "Epsilon=0.794879 Action_times=2321753 Epoche=1100\n",
      "Epsilon=0.794843 Action_times=2322216 Epoche=1101\n",
      "Epsilon=0.794716 Action_times=2323828 Epoche=1102\n",
      "Epsilon=0.794679 Action_times=2324299 Epoche=1103\n",
      "Epsilon=0.794608 Action_times=2325213 Epoche=1104\n",
      "Epsilon=0.794550 Action_times=2325949 Epoche=1105\n",
      "Epsilon=0.794548 Action_times=2325973 Epoche=1106\n",
      "Epsilon=0.794447 Action_times=2327253 Epoche=1107\n",
      "Epsilon=0.794425 Action_times=2327544 Epoche=1108\n",
      "Epsilon=0.794320 Action_times=2328873 Epoche=1109\n",
      "Epsilon=0.794197 Action_times=2330444 Epoche=1110\n",
      "Epsilon=0.794150 Action_times=2331046 Epoche=1111\n",
      "Epsilon=0.794043 Action_times=2332416 Epoche=1112\n",
      "Epsilon=0.793979 Action_times=2333226 Epoche=1113\n",
      "Epsilon=0.793921 Action_times=2333965 Epoche=1114\n",
      "Epsilon=0.793643 Action_times=2337508 Epoche=1115\n",
      "Epsilon=0.793409 Action_times=2340494 Epoche=1116\n",
      "Epsilon=0.793265 Action_times=2342345 Epoche=1117\n",
      "Epsilon=0.793246 Action_times=2342584 Epoche=1118\n",
      "Epsilon=0.793045 Action_times=2345148 Epoche=1119\n",
      "Epsilon=0.792985 Action_times=2345909 Epoche=1120\n",
      "Epsilon=0.792924 Action_times=2346699 Epoche=1121\n",
      "Epsilon=0.792790 Action_times=2348405 Epoche=1122\n",
      "Epsilon=0.792765 Action_times=2348723 Epoche=1123\n",
      "Epsilon=0.792657 Action_times=2350103 Epoche=1124\n",
      "Epsilon=0.792538 Action_times=2351624 Epoche=1125\n",
      "Epsilon=0.792439 Action_times=2352892 Epoche=1126\n",
      "Epsilon=0.792333 Action_times=2354246 Epoche=1127\n",
      "Epsilon=0.792202 Action_times=2355919 Epoche=1128\n",
      "Epsilon=0.792060 Action_times=2357729 Epoche=1129\n",
      "Epsilon=0.791922 Action_times=2359496 Epoche=1130\n",
      "Epsilon=0.791847 Action_times=2360459 Epoche=1131\n",
      "Epsilon=0.791773 Action_times=2361401 Epoche=1132\n",
      "Epsilon=0.791732 Action_times=2361931 Epoche=1133\n",
      "Epsilon=0.791672 Action_times=2362694 Epoche=1134\n",
      "Epsilon=0.791562 Action_times=2364103 Epoche=1135\n",
      "Epsilon=0.791471 Action_times=2365268 Epoche=1136\n",
      "Epsilon=0.791398 Action_times=2366208 Epoche=1137\n",
      "Epsilon=0.791286 Action_times=2367638 Epoche=1138\n",
      "Epsilon=0.791138 Action_times=2369536 Epoche=1139\n",
      "Epsilon=0.791081 Action_times=2370255 Epoche=1140\n",
      "Epsilon=0.791037 Action_times=2370830 Epoche=1141\n",
      "Epsilon=0.790892 Action_times=2372678 Epoche=1142\n",
      "Epsilon=0.790823 Action_times=2373568 Epoche=1143\n",
      "Epsilon=0.790649 Action_times=2375787 Epoche=1144\n",
      "Epsilon=0.790538 Action_times=2377212 Epoche=1145\n",
      "Epsilon=0.790259 Action_times=2380784 Epoche=1146\n",
      "Epsilon=0.790001 Action_times=2384093 Epoche=1147\n",
      "Epsilon=0.789904 Action_times=2385341 Epoche=1148\n",
      "Epsilon=0.789679 Action_times=2388232 Epoche=1149\n",
      "Epsilon=0.789578 Action_times=2389522 Epoche=1150\n",
      "Epsilon=0.789470 Action_times=2390905 Epoche=1151\n",
      "Epsilon=0.789350 Action_times=2392449 Epoche=1152\n",
      "Epsilon=0.789123 Action_times=2395364 Epoche=1153\n",
      "Epsilon=0.789071 Action_times=2396029 Epoche=1154\n",
      "Epsilon=0.788941 Action_times=2397701 Epoche=1155\n",
      "Epsilon=0.788908 Action_times=2398122 Epoche=1156\n",
      "Epsilon=0.788703 Action_times=2400750 Epoche=1157\n",
      "Epsilon=0.788551 Action_times=2402710 Epoche=1158\n",
      "Epsilon=0.788355 Action_times=2405225 Epoche=1159\n",
      "Epsilon=0.788298 Action_times=2405959 Epoche=1160\n",
      "Epsilon=0.788277 Action_times=2406226 Epoche=1161\n",
      "Epsilon=0.788197 Action_times=2407248 Epoche=1162\n",
      "Epsilon=0.788050 Action_times=2409145 Epoche=1163\n",
      "Epsilon=0.787868 Action_times=2411475 Epoche=1164\n",
      "Epsilon=0.787478 Action_times=2416494 Epoche=1165\n",
      "Epsilon=0.787453 Action_times=2416822 Epoche=1166\n",
      "Epsilon=0.787310 Action_times=2418660 Epoche=1167\n",
      "Epsilon=0.787062 Action_times=2421845 Epoche=1168\n",
      "Epsilon=0.786992 Action_times=2422748 Epoche=1169\n",
      "Epsilon=0.786783 Action_times=2425441 Epoche=1170\n",
      "Epsilon=0.786608 Action_times=2427687 Epoche=1171\n",
      "Epsilon=0.786532 Action_times=2428665 Epoche=1172\n",
      "Epsilon=0.786231 Action_times=2432549 Epoche=1173\n",
      "Epsilon=0.786122 Action_times=2433946 Epoche=1174\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.785995 Action_times=2435587 Epoche=1175\n",
      "Epsilon=0.785566 Action_times=2441119 Epoche=1176\n",
      "Epsilon=0.785444 Action_times=2442687 Epoche=1177\n",
      "Epsilon=0.785257 Action_times=2445110 Epoche=1178\n",
      "Epsilon=0.785035 Action_times=2447969 Epoche=1179\n",
      "Epsilon=0.784937 Action_times=2449237 Epoche=1180\n",
      "Epsilon=0.784906 Action_times=2449629 Epoche=1181\n",
      "Epsilon=0.784730 Action_times=2451903 Epoche=1182\n",
      "Epsilon=0.784627 Action_times=2453237 Epoche=1183\n",
      "Epsilon=0.784590 Action_times=2453707 Epoche=1184\n",
      "Epsilon=0.784427 Action_times=2455818 Epoche=1185\n",
      "Epsilon=0.784344 Action_times=2456887 Epoche=1186\n",
      "Epsilon=0.784203 Action_times=2458713 Epoche=1187\n",
      "Epsilon=0.784102 Action_times=2460019 Epoche=1188\n",
      "Epsilon=0.783906 Action_times=2462541 Epoche=1189\n",
      "Epsilon=0.783845 Action_times=2463335 Epoche=1190\n",
      "Epsilon=0.783695 Action_times=2465276 Epoche=1191\n",
      "Epsilon=0.783563 Action_times=2466981 Epoche=1192\n",
      "Epsilon=0.783489 Action_times=2467936 Epoche=1193\n",
      "Epsilon=0.783475 Action_times=2468122 Epoche=1194\n",
      "Epsilon=0.783411 Action_times=2468945 Epoche=1195\n",
      "Epsilon=0.783394 Action_times=2469165 Epoche=1196\n",
      "Epsilon=0.783335 Action_times=2469924 Epoche=1197\n",
      "Epsilon=0.783212 Action_times=2471516 Epoche=1198\n",
      "Epsilon=0.783050 Action_times=2473613 Epoche=1199\n",
      "Epsilon=0.783002 Action_times=2474233 Epoche=1200\n",
      "Epsilon=0.782902 Action_times=2475521 Epoche=1201\n",
      "Epsilon=0.782641 Action_times=2478901 Epoche=1202\n",
      "Epsilon=0.782428 Action_times=2481662 Epoche=1203\n",
      "Epsilon=0.782379 Action_times=2482294 Epoche=1204\n",
      "Epsilon=0.782327 Action_times=2482968 Epoche=1205\n",
      "Epsilon=0.782242 Action_times=2484064 Epoche=1206\n",
      "Epsilon=0.781970 Action_times=2487594 Epoche=1207\n",
      "Epsilon=0.781728 Action_times=2490728 Epoche=1208\n",
      "Epsilon=0.781660 Action_times=2491615 Epoche=1209\n",
      "Epsilon=0.781424 Action_times=2494669 Epoche=1210\n",
      "Epsilon=0.781395 Action_times=2495042 Epoche=1211\n",
      "Epsilon=0.781281 Action_times=2496524 Epoche=1212\n",
      "Epsilon=0.781229 Action_times=2497191 Epoche=1213\n",
      "Epsilon=0.780994 Action_times=2500242 Epoche=1214\n",
      "Epsilon=0.780967 Action_times=2500595 Epoche=1215\n",
      "Epsilon=0.780827 Action_times=2502408 Epoche=1216\n",
      "Epsilon=0.780798 Action_times=2502783 Epoche=1217\n",
      "Epsilon=0.780627 Action_times=2505002 Epoche=1218\n",
      "Epsilon=0.780423 Action_times=2507647 Epoche=1219\n",
      "Epsilon=0.780150 Action_times=2511199 Epoche=1220\n",
      "Epsilon=0.780003 Action_times=2513104 Epoche=1221\n",
      "Epsilon=0.779938 Action_times=2513954 Epoche=1222\n",
      "Epsilon=0.779893 Action_times=2514535 Epoche=1223\n",
      "Epsilon=0.779787 Action_times=2515905 Epoche=1224\n",
      "Epsilon=0.779637 Action_times=2517856 Epoche=1225\n",
      "Epsilon=0.779387 Action_times=2521103 Epoche=1226\n",
      "Epsilon=0.779256 Action_times=2522811 Epoche=1227\n",
      "Epsilon=0.779175 Action_times=2523859 Epoche=1228\n",
      "Epsilon=0.779095 Action_times=2524899 Epoche=1229\n",
      "Epsilon=0.779010 Action_times=2526005 Epoche=1230\n",
      "Epsilon=0.778926 Action_times=2527104 Epoche=1231\n",
      "Epsilon=0.778861 Action_times=2527944 Epoche=1232\n",
      "Epsilon=0.778761 Action_times=2529250 Epoche=1233\n",
      "Epsilon=0.778680 Action_times=2530300 Epoche=1234\n",
      "Epsilon=0.778618 Action_times=2531106 Epoche=1235\n",
      "Epsilon=0.778477 Action_times=2532937 Epoche=1236\n",
      "Epsilon=0.778374 Action_times=2534284 Epoche=1237\n",
      "Epsilon=0.778346 Action_times=2534644 Epoche=1238\n",
      "Epsilon=0.778324 Action_times=2534935 Epoche=1239\n",
      "Epsilon=0.778202 Action_times=2536516 Epoche=1240\n",
      "Epsilon=0.778083 Action_times=2538072 Epoche=1241\n",
      "Epsilon=0.778050 Action_times=2538497 Epoche=1242\n",
      "Epsilon=0.777980 Action_times=2539417 Epoche=1243\n",
      "Epsilon=0.777833 Action_times=2541327 Epoche=1244\n",
      "Epsilon=0.777759 Action_times=2542295 Epoche=1245\n",
      "Epsilon=0.777667 Action_times=2543485 Epoche=1246\n",
      "Epsilon=0.777601 Action_times=2544350 Epoche=1247\n",
      "Epsilon=0.777508 Action_times=2545565 Epoche=1248\n",
      "Epsilon=0.777302 Action_times=2548244 Epoche=1249\n",
      "Epsilon=0.777244 Action_times=2549006 Epoche=1250\n",
      "Epsilon=0.777110 Action_times=2550743 Epoche=1251\n",
      "Epsilon=0.777040 Action_times=2551662 Epoche=1252\n",
      "Epsilon=0.776957 Action_times=2552745 Epoche=1253\n",
      "Epsilon=0.776627 Action_times=2557044 Epoche=1254\n",
      "Epsilon=0.776441 Action_times=2559473 Epoche=1255\n",
      "Epsilon=0.776352 Action_times=2560634 Epoche=1256\n",
      "Epsilon=0.776277 Action_times=2561610 Epoche=1257\n",
      "Epsilon=0.776110 Action_times=2563791 Epoche=1258\n",
      "Epsilon=0.776086 Action_times=2564103 Epoche=1259\n",
      "Epsilon=0.775849 Action_times=2567200 Epoche=1260\n",
      "Epsilon=0.775769 Action_times=2568238 Epoche=1261\n",
      "Epsilon=0.775595 Action_times=2570511 Epoche=1262\n",
      "Epsilon=0.775493 Action_times=2571849 Epoche=1263\n",
      "Epsilon=0.775392 Action_times=2573172 Epoche=1264\n",
      "Epsilon=0.775280 Action_times=2574630 Epoche=1265\n",
      "Epsilon=0.775271 Action_times=2574743 Epoche=1266\n",
      "Epsilon=0.775227 Action_times=2575322 Epoche=1267\n",
      "Epsilon=0.775114 Action_times=2576797 Epoche=1268\n",
      "Epsilon=0.775045 Action_times=2577701 Epoche=1269\n",
      "Epsilon=0.774989 Action_times=2578439 Epoche=1270\n",
      "Epsilon=0.774903 Action_times=2579561 Epoche=1271\n",
      "Epsilon=0.774685 Action_times=2582405 Epoche=1272\n",
      "Epsilon=0.774600 Action_times=2583519 Epoche=1273\n",
      "Epsilon=0.774322 Action_times=2587160 Epoche=1274\n",
      "Epsilon=0.774182 Action_times=2588994 Epoche=1275\n",
      "Epsilon=0.774069 Action_times=2590466 Epoche=1276\n",
      "Epsilon=0.774038 Action_times=2590869 Epoche=1277\n",
      "Epsilon=0.773955 Action_times=2591956 Epoche=1278\n",
      "Epsilon=0.773921 Action_times=2592404 Epoche=1279\n",
      "Epsilon=0.773893 Action_times=2592777 Epoche=1280\n",
      "Epsilon=0.773786 Action_times=2594172 Epoche=1281\n",
      "Epsilon=0.773719 Action_times=2595048 Epoche=1282\n",
      "Epsilon=0.773597 Action_times=2596645 Epoche=1283\n",
      "Epsilon=0.773574 Action_times=2596943 Epoche=1284\n",
      "Epsilon=0.773550 Action_times=2597260 Epoche=1285\n",
      "Epsilon=0.773517 Action_times=2597692 Epoche=1286\n",
      "Epsilon=0.773417 Action_times=2599002 Epoche=1287\n",
      "Epsilon=0.773400 Action_times=2599222 Epoche=1288\n",
      "Epsilon=0.773240 Action_times=2601330 Epoche=1289\n",
      "Epsilon=0.773128 Action_times=2602793 Epoche=1290\n",
      "Epsilon=0.773006 Action_times=2604388 Epoche=1291\n",
      "Epsilon=0.772933 Action_times=2605349 Epoche=1292\n",
      "Epsilon=0.772890 Action_times=2605917 Epoche=1293\n",
      "Epsilon=0.772830 Action_times=2606691 Epoche=1294\n",
      "Epsilon=0.772761 Action_times=2607597 Epoche=1295\n",
      "Epsilon=0.772657 Action_times=2608972 Epoche=1296\n",
      "Epsilon=0.772561 Action_times=2610226 Epoche=1297\n",
      "Epsilon=0.772423 Action_times=2612032 Epoche=1298\n",
      "Epsilon=0.772326 Action_times=2613301 Epoche=1299\n",
      "Epsilon=0.772233 Action_times=2614524 Epoche=1300\n",
      "Epsilon=0.772132 Action_times=2615849 Epoche=1301\n",
      "Epsilon=0.772050 Action_times=2616931 Epoche=1302\n",
      "Epsilon=0.771933 Action_times=2618462 Epoche=1303\n",
      "Epsilon=0.771840 Action_times=2619683 Epoche=1304\n",
      "Epsilon=0.771748 Action_times=2620885 Epoche=1305\n",
      "Epsilon=0.771739 Action_times=2621004 Epoche=1306\n",
      "Epsilon=0.771694 Action_times=2621599 Epoche=1307\n",
      "Epsilon=0.771656 Action_times=2622105 Epoche=1308\n",
      "Epsilon=0.771548 Action_times=2623523 Epoche=1309\n",
      "Epsilon=0.771429 Action_times=2625075 Epoche=1310\n",
      "Epsilon=0.771418 Action_times=2625220 Epoche=1311\n",
      "Epsilon=0.771373 Action_times=2625816 Epoche=1312\n",
      "Epsilon=0.771301 Action_times=2626763 Epoche=1313\n",
      "Epsilon=0.771179 Action_times=2628359 Epoche=1314\n",
      "Epsilon=0.771101 Action_times=2629394 Epoche=1315\n",
      "Epsilon=0.771048 Action_times=2630083 Epoche=1316\n",
      "Epsilon=0.770815 Action_times=2633150 Epoche=1317\n",
      "Epsilon=0.770668 Action_times=2635077 Epoche=1318\n",
      "Epsilon=0.770438 Action_times=2638102 Epoche=1319\n",
      "Epsilon=0.770333 Action_times=2639491 Epoche=1320\n",
      "Epsilon=0.770258 Action_times=2640467 Epoche=1321\n",
      "Epsilon=0.770231 Action_times=2640831 Epoche=1322\n",
      "Epsilon=0.769913 Action_times=2645009 Epoche=1323\n",
      "Epsilon=0.769816 Action_times=2646290 Epoche=1324\n",
      "Epsilon=0.769706 Action_times=2647730 Epoche=1325\n",
      "Epsilon=0.769564 Action_times=2649610 Epoche=1326\n",
      "Epsilon=0.769528 Action_times=2650083 Epoche=1327\n",
      "Epsilon=0.769450 Action_times=2651110 Epoche=1328\n",
      "Epsilon=0.769366 Action_times=2652213 Epoche=1329\n",
      "Epsilon=0.769257 Action_times=2653652 Epoche=1330\n",
      "Epsilon=0.769176 Action_times=2654719 Epoche=1331\n",
      "Epsilon=0.769017 Action_times=2656802 Epoche=1332\n",
      "Epsilon=0.768846 Action_times=2659056 Epoche=1333\n",
      "Epsilon=0.768808 Action_times=2659567 Epoche=1334\n",
      "Epsilon=0.768767 Action_times=2660098 Epoche=1335\n",
      "Epsilon=0.768663 Action_times=2661476 Epoche=1336\n",
      "Epsilon=0.768654 Action_times=2661594 Epoche=1337\n",
      "Epsilon=0.768589 Action_times=2662453 Epoche=1338\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.768544 Action_times=2663035 Epoche=1339\n",
      "Epsilon=0.768465 Action_times=2664081 Epoche=1340\n",
      "Epsilon=0.768417 Action_times=2664715 Epoche=1341\n",
      "Epsilon=0.768380 Action_times=2665204 Epoche=1342\n",
      "Epsilon=0.768311 Action_times=2666113 Epoche=1343\n",
      "Epsilon=0.768224 Action_times=2667263 Epoche=1344\n",
      "Epsilon=0.768218 Action_times=2667339 Epoche=1345\n",
      "Epsilon=0.768124 Action_times=2668586 Epoche=1346\n",
      "Epsilon=0.767946 Action_times=2670928 Epoche=1347\n",
      "Epsilon=0.767834 Action_times=2672402 Epoche=1348\n",
      "Epsilon=0.767710 Action_times=2674044 Epoche=1349\n",
      "Epsilon=0.767583 Action_times=2675715 Epoche=1350\n",
      "Epsilon=0.767513 Action_times=2676648 Epoche=1351\n",
      "Epsilon=0.767328 Action_times=2679085 Epoche=1352\n",
      "Epsilon=0.767122 Action_times=2681804 Epoche=1353\n",
      "Epsilon=0.767052 Action_times=2682735 Epoche=1354\n",
      "Epsilon=0.767046 Action_times=2682809 Epoche=1355\n",
      "Epsilon=0.766907 Action_times=2684650 Epoche=1356\n",
      "Epsilon=0.766846 Action_times=2685449 Epoche=1357\n",
      "Epsilon=0.766761 Action_times=2686579 Epoche=1358\n",
      "Epsilon=0.766682 Action_times=2687619 Epoche=1359\n",
      "Epsilon=0.766524 Action_times=2689710 Epoche=1360\n",
      "Epsilon=0.766466 Action_times=2690476 Epoche=1361\n",
      "Epsilon=0.766353 Action_times=2691965 Epoche=1362\n",
      "Epsilon=0.766116 Action_times=2695106 Epoche=1363\n",
      "Epsilon=0.766042 Action_times=2696075 Epoche=1364\n",
      "Epsilon=0.765894 Action_times=2698034 Epoche=1365\n",
      "Epsilon=0.765836 Action_times=2698804 Epoche=1366\n",
      "Epsilon=0.765711 Action_times=2700459 Epoche=1367\n",
      "Epsilon=0.765673 Action_times=2700966 Epoche=1368\n",
      "Epsilon=0.765564 Action_times=2702398 Epoche=1369\n",
      "Epsilon=0.765478 Action_times=2703538 Epoche=1370\n",
      "Epsilon=0.765411 Action_times=2704426 Epoche=1371\n",
      "Epsilon=0.765298 Action_times=2705927 Epoche=1372\n",
      "Epsilon=0.765261 Action_times=2706415 Epoche=1373\n",
      "Epsilon=0.765213 Action_times=2707055 Epoche=1374\n",
      "Epsilon=0.765162 Action_times=2707730 Epoche=1375\n",
      "Epsilon=0.765027 Action_times=2709516 Epoche=1376\n",
      "Epsilon=0.764812 Action_times=2712358 Epoche=1377\n",
      "Epsilon=0.764797 Action_times=2712564 Epoche=1378\n",
      "Epsilon=0.764780 Action_times=2712785 Epoche=1379\n",
      "Epsilon=0.764684 Action_times=2714063 Epoche=1380\n",
      "Epsilon=0.764649 Action_times=2714523 Epoche=1381\n",
      "Epsilon=0.764461 Action_times=2717020 Epoche=1382\n",
      "Epsilon=0.764372 Action_times=2718188 Epoche=1383\n",
      "Epsilon=0.764108 Action_times=2721700 Epoche=1384\n",
      "Epsilon=0.764019 Action_times=2722875 Epoche=1385\n",
      "Epsilon=0.763828 Action_times=2725403 Epoche=1386\n",
      "Epsilon=0.763535 Action_times=2729291 Epoche=1387\n",
      "Epsilon=0.763426 Action_times=2730735 Epoche=1388\n",
      "Epsilon=0.763315 Action_times=2732221 Epoche=1389\n",
      "Epsilon=0.763144 Action_times=2734486 Epoche=1390\n",
      "Epsilon=0.762974 Action_times=2736739 Epoche=1391\n",
      "Epsilon=0.762949 Action_times=2737073 Epoche=1392\n",
      "Epsilon=0.762868 Action_times=2738149 Epoche=1393\n",
      "Epsilon=0.762821 Action_times=2738775 Epoche=1394\n",
      "Epsilon=0.762701 Action_times=2740369 Epoche=1395\n",
      "Epsilon=0.762662 Action_times=2740892 Epoche=1396\n",
      "Epsilon=0.762619 Action_times=2741452 Epoche=1397\n",
      "Epsilon=0.762392 Action_times=2744480 Epoche=1398\n",
      "Epsilon=0.762295 Action_times=2745769 Epoche=1399\n",
      "Epsilon=0.762292 Action_times=2745806 Epoche=1400\n",
      "Epsilon=0.762074 Action_times=2748703 Epoche=1401\n",
      "Epsilon=0.761957 Action_times=2750264 Epoche=1402\n",
      "Epsilon=0.761842 Action_times=2751793 Epoche=1403\n",
      "Epsilon=0.761687 Action_times=2753846 Epoche=1404\n",
      "Epsilon=0.761609 Action_times=2754891 Epoche=1405\n",
      "Epsilon=0.761508 Action_times=2756225 Epoche=1406\n",
      "Epsilon=0.761367 Action_times=2758110 Epoche=1407\n",
      "Epsilon=0.761280 Action_times=2759270 Epoche=1408\n",
      "Epsilon=0.761233 Action_times=2759894 Epoche=1409\n",
      "Epsilon=0.761063 Action_times=2762158 Epoche=1410\n",
      "Epsilon=0.760941 Action_times=2763781 Epoche=1411\n",
      "Epsilon=0.760775 Action_times=2765995 Epoche=1412\n",
      "Epsilon=0.760723 Action_times=2766681 Epoche=1413\n",
      "Epsilon=0.760620 Action_times=2768057 Epoche=1414\n",
      "Epsilon=0.760391 Action_times=2771104 Epoche=1415\n",
      "Epsilon=0.760204 Action_times=2773594 Epoche=1416\n",
      "Epsilon=0.760196 Action_times=2773703 Epoche=1417\n",
      "Epsilon=0.760038 Action_times=2775810 Epoche=1418\n",
      "Epsilon=0.759874 Action_times=2778002 Epoche=1419\n",
      "Epsilon=0.759823 Action_times=2778675 Epoche=1420\n",
      "Epsilon=0.759690 Action_times=2780452 Epoche=1421\n",
      "Epsilon=0.759569 Action_times=2782062 Epoche=1422\n",
      "Epsilon=0.759398 Action_times=2784343 Epoche=1423\n",
      "Epsilon=0.759325 Action_times=2785317 Epoche=1424\n",
      "Epsilon=0.759303 Action_times=2785613 Epoche=1425\n",
      "Epsilon=0.759287 Action_times=2785824 Epoche=1426\n",
      "Epsilon=0.759260 Action_times=2786193 Epoche=1427\n",
      "Epsilon=0.759242 Action_times=2786434 Epoche=1428\n",
      "Epsilon=0.759157 Action_times=2787561 Epoche=1429\n",
      "Epsilon=0.759122 Action_times=2788037 Epoche=1430\n",
      "Epsilon=0.759023 Action_times=2789346 Epoche=1431\n",
      "Epsilon=0.758916 Action_times=2790782 Epoche=1432\n",
      "Epsilon=0.758897 Action_times=2791038 Epoche=1433\n",
      "Epsilon=0.758851 Action_times=2791655 Epoche=1434\n",
      "Epsilon=0.758788 Action_times=2792495 Epoche=1435\n",
      "Epsilon=0.758596 Action_times=2795049 Epoche=1436\n",
      "Epsilon=0.758547 Action_times=2795709 Epoche=1437\n",
      "Epsilon=0.758472 Action_times=2796708 Epoche=1438\n",
      "Epsilon=0.758393 Action_times=2797770 Epoche=1439\n",
      "Epsilon=0.758274 Action_times=2799363 Epoche=1440\n",
      "Epsilon=0.758208 Action_times=2800245 Epoche=1441\n",
      "Epsilon=0.758024 Action_times=2802693 Epoche=1442\n",
      "Epsilon=0.757954 Action_times=2803641 Epoche=1443\n",
      "Epsilon=0.757898 Action_times=2804390 Epoche=1444\n",
      "Epsilon=0.757745 Action_times=2806436 Epoche=1445\n",
      "Epsilon=0.757623 Action_times=2808066 Epoche=1446\n",
      "Epsilon=0.757596 Action_times=2808420 Epoche=1447\n",
      "Epsilon=0.757490 Action_times=2809845 Epoche=1448\n",
      "Epsilon=0.757469 Action_times=2810118 Epoche=1449\n",
      "Epsilon=0.757434 Action_times=2810591 Epoche=1450\n",
      "Epsilon=0.757374 Action_times=2811388 Epoche=1451\n",
      "Epsilon=0.757365 Action_times=2811513 Epoche=1452\n",
      "Epsilon=0.757291 Action_times=2812509 Epoche=1453\n",
      "Epsilon=0.757131 Action_times=2814638 Epoche=1454\n",
      "Epsilon=0.757053 Action_times=2815694 Epoche=1455\n",
      "Epsilon=0.756937 Action_times=2817245 Epoche=1456\n",
      "Epsilon=0.756797 Action_times=2819109 Epoche=1457\n",
      "Epsilon=0.756690 Action_times=2820550 Epoche=1458\n",
      "Epsilon=0.756593 Action_times=2821850 Epoche=1459\n",
      "Epsilon=0.756526 Action_times=2822740 Epoche=1460\n",
      "Epsilon=0.756516 Action_times=2822879 Epoche=1461\n",
      "Epsilon=0.756460 Action_times=2823629 Epoche=1462\n",
      "Epsilon=0.756378 Action_times=2824726 Epoche=1463\n",
      "Epsilon=0.756280 Action_times=2826044 Epoche=1464\n",
      "Epsilon=0.756176 Action_times=2827432 Epoche=1465\n",
      "Epsilon=0.756122 Action_times=2828156 Epoche=1466\n",
      "Epsilon=0.755992 Action_times=2829898 Epoche=1467\n",
      "Epsilon=0.755726 Action_times=2833464 Epoche=1468\n",
      "Epsilon=0.755624 Action_times=2834837 Epoche=1469\n",
      "Epsilon=0.755594 Action_times=2835243 Epoche=1470\n",
      "Epsilon=0.755529 Action_times=2836108 Epoche=1471\n",
      "Epsilon=0.755455 Action_times=2837104 Epoche=1472\n",
      "Epsilon=0.755408 Action_times=2837733 Epoche=1473\n",
      "Epsilon=0.755279 Action_times=2839463 Epoche=1474\n",
      "Epsilon=0.755174 Action_times=2840870 Epoche=1475\n",
      "Epsilon=0.755095 Action_times=2841933 Epoche=1476\n",
      "Epsilon=0.754953 Action_times=2843842 Epoche=1477\n",
      "Epsilon=0.754789 Action_times=2846042 Epoche=1478\n",
      "Epsilon=0.754663 Action_times=2847734 Epoche=1479\n",
      "Epsilon=0.754580 Action_times=2848846 Epoche=1480\n",
      "Epsilon=0.754545 Action_times=2849317 Epoche=1481\n",
      "Epsilon=0.754439 Action_times=2850735 Epoche=1482\n",
      "Epsilon=0.754300 Action_times=2852614 Epoche=1483\n",
      "Epsilon=0.754226 Action_times=2853604 Epoche=1484\n",
      "Epsilon=0.754172 Action_times=2854323 Epoche=1485\n",
      "Epsilon=0.753960 Action_times=2857176 Epoche=1486\n",
      "Epsilon=0.753929 Action_times=2857590 Epoche=1487\n",
      "Epsilon=0.753760 Action_times=2859871 Epoche=1488\n",
      "Epsilon=0.753716 Action_times=2860458 Epoche=1489\n",
      "Epsilon=0.753640 Action_times=2861484 Epoche=1490\n",
      "Epsilon=0.753599 Action_times=2862024 Epoche=1491\n",
      "Epsilon=0.753558 Action_times=2862586 Epoche=1492\n",
      "Epsilon=0.753536 Action_times=2862879 Epoche=1493\n",
      "Epsilon=0.753480 Action_times=2863629 Epoche=1494\n",
      "Epsilon=0.753396 Action_times=2864755 Epoche=1495\n",
      "Epsilon=0.753246 Action_times=2866773 Epoche=1496\n",
      "Epsilon=0.753142 Action_times=2868180 Epoche=1497\n",
      "Epsilon=0.753022 Action_times=2869793 Epoche=1498\n",
      "Epsilon=0.752933 Action_times=2870993 Epoche=1499\n",
      "Epsilon=0.752887 Action_times=2871610 Epoche=1500\n",
      "Epsilon=0.752842 Action_times=2872219 Epoche=1501\n",
      "Epsilon=0.752731 Action_times=2873705 Epoche=1502\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.752656 Action_times=2874717 Epoche=1503\n",
      "Epsilon=0.752511 Action_times=2876675 Epoche=1504\n",
      "Epsilon=0.752428 Action_times=2877785 Epoche=1505\n",
      "Epsilon=0.752351 Action_times=2878830 Epoche=1506\n",
      "Epsilon=0.752299 Action_times=2879527 Epoche=1507\n",
      "Epsilon=0.752247 Action_times=2880227 Epoche=1508\n",
      "Epsilon=0.752224 Action_times=2880543 Epoche=1509\n",
      "Epsilon=0.752168 Action_times=2881289 Epoche=1510\n",
      "Epsilon=0.752046 Action_times=2882943 Epoche=1511\n",
      "Epsilon=0.751948 Action_times=2884257 Epoche=1512\n",
      "Epsilon=0.751860 Action_times=2885449 Epoche=1513\n",
      "Epsilon=0.751844 Action_times=2885655 Epoche=1514\n",
      "Epsilon=0.751790 Action_times=2886383 Epoche=1515\n",
      "Epsilon=0.751692 Action_times=2887715 Epoche=1516\n",
      "Epsilon=0.751673 Action_times=2887967 Epoche=1517\n",
      "Epsilon=0.751581 Action_times=2889201 Epoche=1518\n",
      "Epsilon=0.751541 Action_times=2889747 Epoche=1519\n",
      "Epsilon=0.751388 Action_times=2891815 Epoche=1520\n",
      "Epsilon=0.751231 Action_times=2893930 Epoche=1521\n",
      "Epsilon=0.751062 Action_times=2896211 Epoche=1522\n",
      "Epsilon=0.751021 Action_times=2896754 Epoche=1523\n",
      "Epsilon=0.751011 Action_times=2896894 Epoche=1524\n",
      "Epsilon=0.750915 Action_times=2898194 Epoche=1525\n",
      "Epsilon=0.750774 Action_times=2900091 Epoche=1526\n",
      "Epsilon=0.750754 Action_times=2900369 Epoche=1527\n",
      "Epsilon=0.750603 Action_times=2902407 Epoche=1528\n",
      "Epsilon=0.750583 Action_times=2902668 Epoche=1529\n",
      "Epsilon=0.750530 Action_times=2903388 Epoche=1530\n",
      "Epsilon=0.750490 Action_times=2903932 Epoche=1531\n",
      "Epsilon=0.750306 Action_times=2906413 Epoche=1532\n",
      "Epsilon=0.750202 Action_times=2907820 Epoche=1533\n",
      "Epsilon=0.750051 Action_times=2909860 Epoche=1534\n",
      "Epsilon=0.749992 Action_times=2910662 Epoche=1535\n",
      "Epsilon=0.749908 Action_times=2911791 Epoche=1536\n",
      "Epsilon=0.749835 Action_times=2912774 Epoche=1537\n",
      "Epsilon=0.749477 Action_times=2917615 Epoche=1538\n",
      "Epsilon=0.749344 Action_times=2919416 Epoche=1539\n",
      "Epsilon=0.749246 Action_times=2920737 Epoche=1540\n",
      "Epsilon=0.749104 Action_times=2922663 Epoche=1541\n",
      "Epsilon=0.748946 Action_times=2924801 Epoche=1542\n",
      "Epsilon=0.748847 Action_times=2926138 Epoche=1543\n",
      "Epsilon=0.748788 Action_times=2926934 Epoche=1544\n",
      "Epsilon=0.748669 Action_times=2928557 Epoche=1545\n",
      "Epsilon=0.748646 Action_times=2928867 Epoche=1546\n",
      "Epsilon=0.748608 Action_times=2929381 Epoche=1547\n",
      "Epsilon=0.748538 Action_times=2930327 Epoche=1548\n",
      "Epsilon=0.748482 Action_times=2931080 Epoche=1549\n",
      "Epsilon=0.748440 Action_times=2931650 Epoche=1550\n",
      "Epsilon=0.748415 Action_times=2931985 Epoche=1551\n",
      "Epsilon=0.748346 Action_times=2932930 Epoche=1552\n",
      "Epsilon=0.748256 Action_times=2934144 Epoche=1553\n",
      "Epsilon=0.748214 Action_times=2934718 Epoche=1554\n",
      "Epsilon=0.748125 Action_times=2935912 Epoche=1555\n",
      "Epsilon=0.748047 Action_times=2936974 Epoche=1556\n",
      "Epsilon=0.747999 Action_times=2937623 Epoche=1557\n",
      "Epsilon=0.747775 Action_times=2940658 Epoche=1558\n",
      "Epsilon=0.747752 Action_times=2940972 Epoche=1559\n",
      "Epsilon=0.747732 Action_times=2941238 Epoche=1560\n",
      "Epsilon=0.747678 Action_times=2941975 Epoche=1561\n",
      "Epsilon=0.747567 Action_times=2943476 Epoche=1562\n",
      "Epsilon=0.747558 Action_times=2943597 Epoche=1563\n",
      "Epsilon=0.747404 Action_times=2945687 Epoche=1564\n",
      "Epsilon=0.747345 Action_times=2946489 Epoche=1565\n",
      "Epsilon=0.747182 Action_times=2948698 Epoche=1566\n",
      "Epsilon=0.747027 Action_times=2950804 Epoche=1567\n",
      "Epsilon=0.746951 Action_times=2951833 Epoche=1568\n",
      "Epsilon=0.746909 Action_times=2952404 Epoche=1569\n",
      "Epsilon=0.746860 Action_times=2953074 Epoche=1570\n",
      "Epsilon=0.746732 Action_times=2954810 Epoche=1571\n",
      "Epsilon=0.746661 Action_times=2955776 Epoche=1572\n",
      "Epsilon=0.746618 Action_times=2956350 Epoche=1573\n",
      "Epsilon=0.746592 Action_times=2956708 Epoche=1574\n",
      "Epsilon=0.746356 Action_times=2959907 Epoche=1575\n",
      "Epsilon=0.746271 Action_times=2961063 Epoche=1576\n",
      "Epsilon=0.746173 Action_times=2962395 Epoche=1577\n",
      "Epsilon=0.746116 Action_times=2963174 Epoche=1578\n",
      "Epsilon=0.746066 Action_times=2963846 Epoche=1579\n",
      "Epsilon=0.745937 Action_times=2965599 Epoche=1580\n",
      "Epsilon=0.745832 Action_times=2967034 Epoche=1581\n",
      "Epsilon=0.745720 Action_times=2968551 Epoche=1582\n",
      "Epsilon=0.745586 Action_times=2970371 Epoche=1583\n",
      "Epsilon=0.745520 Action_times=2971272 Epoche=1584\n",
      "Epsilon=0.745376 Action_times=2973235 Epoche=1585\n",
      "Epsilon=0.745297 Action_times=2974308 Epoche=1586\n",
      "Epsilon=0.745266 Action_times=2974723 Epoche=1587\n",
      "Epsilon=0.745156 Action_times=2976219 Epoche=1588\n",
      "Epsilon=0.745113 Action_times=2976802 Epoche=1589\n",
      "Epsilon=0.745086 Action_times=2977181 Epoche=1590\n",
      "Epsilon=0.744957 Action_times=2978934 Epoche=1591\n",
      "Epsilon=0.744908 Action_times=2979603 Epoche=1592\n",
      "Epsilon=0.744848 Action_times=2980409 Epoche=1593\n",
      "Epsilon=0.744648 Action_times=2983136 Epoche=1594\n",
      "Epsilon=0.744553 Action_times=2984427 Epoche=1595\n",
      "Epsilon=0.744494 Action_times=2985230 Epoche=1596\n",
      "Epsilon=0.744346 Action_times=2987240 Epoche=1597\n",
      "Epsilon=0.744276 Action_times=2988197 Epoche=1598\n",
      "Epsilon=0.744183 Action_times=2989467 Epoche=1599\n",
      "Epsilon=0.744031 Action_times=2991533 Epoche=1600\n",
      "Epsilon=0.743990 Action_times=2992090 Epoche=1601\n",
      "Epsilon=0.743890 Action_times=2993459 Epoche=1602\n",
      "Epsilon=0.743803 Action_times=2994644 Epoche=1603\n",
      "Epsilon=0.743795 Action_times=2994747 Epoche=1604\n",
      "Epsilon=0.743751 Action_times=2995351 Epoche=1605\n",
      "Epsilon=0.743518 Action_times=2998534 Epoche=1606\n",
      "Epsilon=0.743499 Action_times=2998791 Epoche=1607\n",
      "Epsilon=0.743455 Action_times=2999391 Epoche=1608\n",
      "Epsilon=0.743274 Action_times=3001854 Epoche=1609\n",
      "Epsilon=0.743243 Action_times=3002280 Epoche=1610\n",
      "Epsilon=0.743207 Action_times=3002775 Epoche=1611\n",
      "Epsilon=0.743132 Action_times=3003785 Epoche=1612\n",
      "Epsilon=0.743025 Action_times=3005256 Epoche=1613\n",
      "Epsilon=0.742939 Action_times=3006431 Epoche=1614\n",
      "Epsilon=0.742852 Action_times=3007609 Epoche=1615\n",
      "Epsilon=0.742672 Action_times=3010067 Epoche=1616\n",
      "Epsilon=0.742624 Action_times=3010730 Epoche=1617\n",
      "Epsilon=0.742470 Action_times=3012825 Epoche=1618\n",
      "Epsilon=0.742409 Action_times=3013659 Epoche=1619\n",
      "Epsilon=0.742333 Action_times=3014692 Epoche=1620\n",
      "Epsilon=0.742320 Action_times=3014872 Epoche=1621\n",
      "Epsilon=0.742149 Action_times=3017212 Epoche=1622\n",
      "Epsilon=0.742007 Action_times=3019154 Epoche=1623\n",
      "Epsilon=0.741867 Action_times=3021061 Epoche=1624\n",
      "Epsilon=0.741798 Action_times=3022002 Epoche=1625\n",
      "Epsilon=0.741678 Action_times=3023639 Epoche=1626\n",
      "Epsilon=0.741606 Action_times=3024625 Epoche=1627\n",
      "Epsilon=0.741491 Action_times=3026197 Epoche=1628\n",
      "Epsilon=0.741374 Action_times=3027799 Epoche=1629\n",
      "Epsilon=0.741291 Action_times=3028937 Epoche=1630\n",
      "Epsilon=0.741164 Action_times=3030666 Epoche=1631\n",
      "Epsilon=0.741114 Action_times=3031352 Epoche=1632\n",
      "Epsilon=0.741065 Action_times=3032019 Epoche=1633\n",
      "Epsilon=0.740927 Action_times=3033913 Epoche=1634\n",
      "Epsilon=0.740815 Action_times=3035450 Epoche=1635\n",
      "Epsilon=0.740725 Action_times=3036682 Epoche=1636\n",
      "Epsilon=0.740642 Action_times=3037817 Epoche=1637\n",
      "Epsilon=0.740603 Action_times=3038342 Epoche=1638\n",
      "Epsilon=0.740538 Action_times=3039242 Epoche=1639\n",
      "Epsilon=0.740493 Action_times=3039847 Epoche=1640\n",
      "Epsilon=0.740471 Action_times=3040155 Epoche=1641\n",
      "Epsilon=0.740382 Action_times=3041370 Epoche=1642\n",
      "Epsilon=0.740334 Action_times=3042029 Epoche=1643\n",
      "Epsilon=0.740255 Action_times=3043118 Epoche=1644\n",
      "Epsilon=0.740218 Action_times=3043623 Epoche=1645\n",
      "Epsilon=0.740106 Action_times=3045156 Epoche=1646\n",
      "Epsilon=0.740019 Action_times=3046342 Epoche=1647\n",
      "Epsilon=0.739897 Action_times=3048016 Epoche=1648\n",
      "Epsilon=0.739828 Action_times=3048962 Epoche=1649\n",
      "Epsilon=0.739718 Action_times=3050466 Epoche=1650\n",
      "Epsilon=0.739696 Action_times=3050763 Epoche=1651\n",
      "Epsilon=0.739672 Action_times=3051097 Epoche=1652\n",
      "Epsilon=0.739569 Action_times=3052511 Epoche=1653\n",
      "Epsilon=0.739553 Action_times=3052733 Epoche=1654\n",
      "Epsilon=0.739423 Action_times=3054508 Epoche=1655\n",
      "Epsilon=0.739377 Action_times=3055139 Epoche=1656\n",
      "Epsilon=0.739328 Action_times=3055820 Epoche=1657\n",
      "Epsilon=0.739193 Action_times=3057661 Epoche=1658\n",
      "Epsilon=0.739163 Action_times=3058072 Epoche=1659\n",
      "Epsilon=0.739159 Action_times=3058129 Epoche=1660\n",
      "Epsilon=0.739068 Action_times=3059381 Epoche=1661\n",
      "Epsilon=0.738974 Action_times=3060663 Epoche=1662\n",
      "Epsilon=0.738951 Action_times=3060979 Epoche=1663\n",
      "Epsilon=0.738847 Action_times=3062406 Epoche=1664\n",
      "Epsilon=0.738665 Action_times=3064904 Epoche=1665\n",
      "Epsilon=0.738628 Action_times=3065414 Epoche=1666\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.738512 Action_times=3067005 Epoche=1667\n",
      "Epsilon=0.738319 Action_times=3069657 Epoche=1668\n",
      "Epsilon=0.738209 Action_times=3071174 Epoche=1669\n",
      "Epsilon=0.738113 Action_times=3072484 Epoche=1670\n",
      "Epsilon=0.737973 Action_times=3074409 Epoche=1671\n",
      "Epsilon=0.737893 Action_times=3075504 Epoche=1672\n",
      "Epsilon=0.737816 Action_times=3076569 Epoche=1673\n",
      "Epsilon=0.737770 Action_times=3077192 Epoche=1674\n",
      "Epsilon=0.737651 Action_times=3078829 Epoche=1675\n",
      "Epsilon=0.737569 Action_times=3079965 Epoche=1676\n",
      "Epsilon=0.737476 Action_times=3081234 Epoche=1677\n",
      "Epsilon=0.737400 Action_times=3082287 Epoche=1678\n",
      "Epsilon=0.737337 Action_times=3083157 Epoche=1679\n",
      "Epsilon=0.737259 Action_times=3084216 Epoche=1680\n",
      "Epsilon=0.737195 Action_times=3085097 Epoche=1681\n",
      "Epsilon=0.737156 Action_times=3085636 Epoche=1682\n",
      "Epsilon=0.737000 Action_times=3087787 Epoche=1683\n",
      "Epsilon=0.736903 Action_times=3089124 Epoche=1684\n",
      "Epsilon=0.736868 Action_times=3089599 Epoche=1685\n",
      "Epsilon=0.736794 Action_times=3090621 Epoche=1686\n",
      "Epsilon=0.736786 Action_times=3090730 Epoche=1687\n",
      "Epsilon=0.736726 Action_times=3091552 Epoche=1688\n",
      "Epsilon=0.736606 Action_times=3093201 Epoche=1689\n",
      "Epsilon=0.736556 Action_times=3093892 Epoche=1690\n",
      "Epsilon=0.736478 Action_times=3094973 Epoche=1691\n",
      "Epsilon=0.736370 Action_times=3096454 Epoche=1692\n",
      "Epsilon=0.736256 Action_times=3098024 Epoche=1693\n",
      "Epsilon=0.736094 Action_times=3100256 Epoche=1694\n",
      "Epsilon=0.736049 Action_times=3100871 Epoche=1695\n",
      "Epsilon=0.735989 Action_times=3101707 Epoche=1696\n",
      "Epsilon=0.735863 Action_times=3103432 Epoche=1697\n",
      "Epsilon=0.735807 Action_times=3104204 Epoche=1698\n",
      "Epsilon=0.735763 Action_times=3104815 Epoche=1699\n",
      "Epsilon=0.735706 Action_times=3105598 Epoche=1700\n",
      "Epsilon=0.735629 Action_times=3106661 Epoche=1701\n",
      "Epsilon=0.735560 Action_times=3107614 Epoche=1702\n",
      "Epsilon=0.735492 Action_times=3108546 Epoche=1703\n",
      "Epsilon=0.735427 Action_times=3109451 Epoche=1704\n",
      "Epsilon=0.735312 Action_times=3111037 Epoche=1705\n",
      "Epsilon=0.735159 Action_times=3113139 Epoche=1706\n",
      "Epsilon=0.735098 Action_times=3113986 Epoche=1707\n",
      "Epsilon=0.735056 Action_times=3114555 Epoche=1708\n",
      "Epsilon=0.734961 Action_times=3115874 Epoche=1709\n",
      "Epsilon=0.734849 Action_times=3117413 Epoche=1710\n",
      "Epsilon=0.734743 Action_times=3118880 Epoche=1711\n",
      "Epsilon=0.734620 Action_times=3120571 Epoche=1712\n",
      "Epsilon=0.734602 Action_times=3120821 Epoche=1713\n",
      "Epsilon=0.734438 Action_times=3123093 Epoche=1714\n",
      "Epsilon=0.734374 Action_times=3123976 Epoche=1715\n",
      "Epsilon=0.734331 Action_times=3124564 Epoche=1716\n",
      "Epsilon=0.734232 Action_times=3125927 Epoche=1717\n",
      "Epsilon=0.734187 Action_times=3126549 Epoche=1718\n",
      "Epsilon=0.734053 Action_times=3128401 Epoche=1719\n",
      "Epsilon=0.733874 Action_times=3130879 Epoche=1720\n",
      "Epsilon=0.733723 Action_times=3132966 Epoche=1721\n",
      "Epsilon=0.733665 Action_times=3133758 Epoche=1722\n",
      "Epsilon=0.733607 Action_times=3134572 Epoche=1723\n",
      "Epsilon=0.733543 Action_times=3135452 Epoche=1724\n",
      "Epsilon=0.733478 Action_times=3136350 Epoche=1725\n",
      "Epsilon=0.733399 Action_times=3137439 Epoche=1726\n",
      "Epsilon=0.733289 Action_times=3138955 Epoche=1727\n",
      "Epsilon=0.733213 Action_times=3140010 Epoche=1728\n",
      "Epsilon=0.733162 Action_times=3140719 Epoche=1729\n",
      "Epsilon=0.733144 Action_times=3140968 Epoche=1730\n",
      "Epsilon=0.733119 Action_times=3141317 Epoche=1731\n",
      "Epsilon=0.733032 Action_times=3142508 Epoche=1732\n",
      "Epsilon=0.732890 Action_times=3144477 Epoche=1733\n",
      "Epsilon=0.732807 Action_times=3145622 Epoche=1734\n",
      "Epsilon=0.732673 Action_times=3147481 Epoche=1735\n",
      "Epsilon=0.732640 Action_times=3147940 Epoche=1736\n",
      "Epsilon=0.732355 Action_times=3151881 Epoche=1737\n",
      "Epsilon=0.732239 Action_times=3153482 Epoche=1738\n",
      "Epsilon=0.732070 Action_times=3155822 Epoche=1739\n",
      "Epsilon=0.732039 Action_times=3156255 Epoche=1740\n",
      "Epsilon=0.731904 Action_times=3158129 Epoche=1741\n",
      "Epsilon=0.731732 Action_times=3160509 Epoche=1742\n",
      "Epsilon=0.731615 Action_times=3162125 Epoche=1743\n",
      "Epsilon=0.731489 Action_times=3163879 Epoche=1744\n",
      "Epsilon=0.731447 Action_times=3164463 Epoche=1745\n",
      "Epsilon=0.731351 Action_times=3165792 Epoche=1746\n",
      "Epsilon=0.731254 Action_times=3167129 Epoche=1747\n",
      "Epsilon=0.731180 Action_times=3168158 Epoche=1748\n",
      "Epsilon=0.731103 Action_times=3169231 Epoche=1749\n",
      "Epsilon=0.730994 Action_times=3170748 Epoche=1750\n",
      "Epsilon=0.730933 Action_times=3171593 Epoche=1751\n",
      "Epsilon=0.730839 Action_times=3172888 Epoche=1752\n",
      "Epsilon=0.730802 Action_times=3173403 Epoche=1753\n",
      "Epsilon=0.730754 Action_times=3174065 Epoche=1754\n",
      "Epsilon=0.730653 Action_times=3175472 Epoche=1755\n",
      "Epsilon=0.730564 Action_times=3176706 Epoche=1756\n",
      "Epsilon=0.730463 Action_times=3178106 Epoche=1757\n",
      "Epsilon=0.730449 Action_times=3178306 Epoche=1758\n",
      "Epsilon=0.730369 Action_times=3179407 Epoche=1759\n",
      "Epsilon=0.730341 Action_times=3179796 Epoche=1760\n",
      "Epsilon=0.730285 Action_times=3180584 Epoche=1761\n",
      "Epsilon=0.730222 Action_times=3181450 Epoche=1762\n",
      "Epsilon=0.730152 Action_times=3182428 Epoche=1763\n",
      "Epsilon=0.730106 Action_times=3183069 Epoche=1764\n",
      "Epsilon=0.729946 Action_times=3185283 Epoche=1765\n",
      "Epsilon=0.729863 Action_times=3186443 Epoche=1766\n",
      "Epsilon=0.729681 Action_times=3188972 Epoche=1767\n",
      "Epsilon=0.729638 Action_times=3189561 Epoche=1768\n",
      "Epsilon=0.729538 Action_times=3190960 Epoche=1769\n",
      "Epsilon=0.729440 Action_times=3192316 Epoche=1770\n",
      "Epsilon=0.729342 Action_times=3193682 Epoche=1771\n",
      "Epsilon=0.729215 Action_times=3195451 Epoche=1772\n",
      "Epsilon=0.729162 Action_times=3196186 Epoche=1773\n",
      "Epsilon=0.729080 Action_times=3197327 Epoche=1774\n",
      "Epsilon=0.729017 Action_times=3198195 Epoche=1775\n",
      "Epsilon=0.728967 Action_times=3198896 Epoche=1776\n",
      "Epsilon=0.728879 Action_times=3200112 Epoche=1777\n",
      "Epsilon=0.728746 Action_times=3201973 Epoche=1778\n",
      "Epsilon=0.728511 Action_times=3205243 Epoche=1779\n",
      "Epsilon=0.728440 Action_times=3206232 Epoche=1780\n",
      "Epsilon=0.728268 Action_times=3208625 Epoche=1781\n",
      "Epsilon=0.728160 Action_times=3210127 Epoche=1782\n",
      "Epsilon=0.728065 Action_times=3211451 Epoche=1783\n",
      "Epsilon=0.727910 Action_times=3213607 Epoche=1784\n",
      "Epsilon=0.727781 Action_times=3215398 Epoche=1785\n",
      "Epsilon=0.727608 Action_times=3217810 Epoche=1786\n",
      "Epsilon=0.727518 Action_times=3219076 Epoche=1787\n",
      "Epsilon=0.727406 Action_times=3220637 Epoche=1788\n",
      "Epsilon=0.727355 Action_times=3221343 Epoche=1789\n",
      "Epsilon=0.727256 Action_times=3222727 Epoche=1790\n",
      "Epsilon=0.727197 Action_times=3223540 Epoche=1791\n",
      "Epsilon=0.727029 Action_times=3225883 Epoche=1792\n",
      "Epsilon=0.726773 Action_times=3229462 Epoche=1793\n",
      "Epsilon=0.726642 Action_times=3231288 Epoche=1794\n",
      "Epsilon=0.726614 Action_times=3231672 Epoche=1795\n",
      "Epsilon=0.726580 Action_times=3232148 Epoche=1796\n",
      "Epsilon=0.726449 Action_times=3233981 Epoche=1797\n",
      "Epsilon=0.726398 Action_times=3234687 Epoche=1798\n",
      "Epsilon=0.726285 Action_times=3236274 Epoche=1799\n",
      "Epsilon=0.726223 Action_times=3237127 Epoche=1800\n",
      "Epsilon=0.726134 Action_times=3238375 Epoche=1801\n",
      "Epsilon=0.726111 Action_times=3238700 Epoche=1802\n",
      "Epsilon=0.726009 Action_times=3240123 Epoche=1803\n",
      "Epsilon=0.726006 Action_times=3240162 Epoche=1804\n",
      "Epsilon=0.725893 Action_times=3241740 Epoche=1805\n",
      "Epsilon=0.725827 Action_times=3242669 Epoche=1806\n",
      "Epsilon=0.725782 Action_times=3243296 Epoche=1807\n",
      "Epsilon=0.725664 Action_times=3244942 Epoche=1808\n",
      "Epsilon=0.725606 Action_times=3245748 Epoche=1809\n",
      "Epsilon=0.725386 Action_times=3248827 Epoche=1810\n",
      "Epsilon=0.725312 Action_times=3249863 Epoche=1811\n",
      "Epsilon=0.725206 Action_times=3251348 Epoche=1812\n",
      "Epsilon=0.725088 Action_times=3252991 Epoche=1813\n",
      "Epsilon=0.725082 Action_times=3253073 Epoche=1814\n",
      "Epsilon=0.725014 Action_times=3254022 Epoche=1815\n",
      "Epsilon=0.724907 Action_times=3255527 Epoche=1816\n",
      "Epsilon=0.724752 Action_times=3257698 Epoche=1817\n",
      "Epsilon=0.724646 Action_times=3259183 Epoche=1818\n",
      "Epsilon=0.724535 Action_times=3260736 Epoche=1819\n",
      "Epsilon=0.724380 Action_times=3262903 Epoche=1820\n",
      "Epsilon=0.724191 Action_times=3265549 Epoche=1821\n",
      "Epsilon=0.724003 Action_times=3268174 Epoche=1822\n",
      "Epsilon=0.723809 Action_times=3270896 Epoche=1823\n",
      "Epsilon=0.723796 Action_times=3271073 Epoche=1824\n",
      "Epsilon=0.723692 Action_times=3272539 Epoche=1825\n",
      "Epsilon=0.723594 Action_times=3273910 Epoche=1826\n",
      "Epsilon=0.723504 Action_times=3275175 Epoche=1827\n",
      "Epsilon=0.723405 Action_times=3276553 Epoche=1828\n",
      "Epsilon=0.723360 Action_times=3277187 Epoche=1829\n",
      "Epsilon=0.723242 Action_times=3278842 Epoche=1830\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.723094 Action_times=3280920 Epoche=1831\n",
      "Epsilon=0.722993 Action_times=3282329 Epoche=1832\n",
      "Epsilon=0.722915 Action_times=3283429 Epoche=1833\n",
      "Epsilon=0.722833 Action_times=3284575 Epoche=1834\n",
      "Epsilon=0.722829 Action_times=3284638 Epoche=1835\n",
      "Epsilon=0.722756 Action_times=3285663 Epoche=1836\n",
      "Epsilon=0.722653 Action_times=3287097 Epoche=1837\n",
      "Epsilon=0.722529 Action_times=3288847 Epoche=1838\n",
      "Epsilon=0.722478 Action_times=3289566 Epoche=1839\n",
      "Epsilon=0.722406 Action_times=3290569 Epoche=1840\n",
      "Epsilon=0.722300 Action_times=3292056 Epoche=1841\n",
      "Epsilon=0.722208 Action_times=3293354 Epoche=1842\n",
      "Epsilon=0.722110 Action_times=3294722 Epoche=1843\n",
      "Epsilon=0.722051 Action_times=3295550 Epoche=1844\n",
      "Epsilon=0.722022 Action_times=3295961 Epoche=1845\n",
      "Epsilon=0.721936 Action_times=3297172 Epoche=1846\n",
      "Epsilon=0.721849 Action_times=3298397 Epoche=1847\n",
      "Epsilon=0.721763 Action_times=3299594 Epoche=1848\n",
      "Epsilon=0.721634 Action_times=3301414 Epoche=1849\n",
      "Epsilon=0.721607 Action_times=3301793 Epoche=1850\n",
      "Epsilon=0.721461 Action_times=3303838 Epoche=1851\n",
      "Epsilon=0.721316 Action_times=3305883 Epoche=1852\n",
      "Epsilon=0.721266 Action_times=3306585 Epoche=1853\n",
      "Epsilon=0.721123 Action_times=3308600 Epoche=1854\n",
      "Epsilon=0.721007 Action_times=3310226 Epoche=1855\n",
      "Epsilon=0.720822 Action_times=3312834 Epoche=1856\n",
      "Epsilon=0.720782 Action_times=3313388 Epoche=1857\n",
      "Epsilon=0.720634 Action_times=3315481 Epoche=1858\n",
      "Epsilon=0.720532 Action_times=3316908 Epoche=1859\n",
      "Epsilon=0.720397 Action_times=3318806 Epoche=1860\n",
      "Epsilon=0.720266 Action_times=3320648 Epoche=1861\n",
      "Epsilon=0.720261 Action_times=3320727 Epoche=1862\n",
      "Epsilon=0.720225 Action_times=3321229 Epoche=1863\n",
      "Epsilon=0.720136 Action_times=3322489 Epoche=1864\n",
      "Epsilon=0.720024 Action_times=3324059 Epoche=1865\n",
      "Epsilon=0.719925 Action_times=3325456 Epoche=1866\n",
      "Epsilon=0.719707 Action_times=3328526 Epoche=1867\n",
      "Epsilon=0.719531 Action_times=3331009 Epoche=1868\n",
      "Epsilon=0.719435 Action_times=3332367 Epoche=1869\n",
      "Epsilon=0.719334 Action_times=3333784 Epoche=1870\n",
      "Epsilon=0.719144 Action_times=3336467 Epoche=1871\n",
      "Epsilon=0.719035 Action_times=3338003 Epoche=1872\n",
      "Epsilon=0.719012 Action_times=3338329 Epoche=1873\n",
      "Epsilon=0.718934 Action_times=3339429 Epoche=1874\n",
      "Epsilon=0.718928 Action_times=3339504 Epoche=1875\n",
      "Epsilon=0.718883 Action_times=3340143 Epoche=1876\n",
      "Epsilon=0.718819 Action_times=3341045 Epoche=1877\n",
      "Epsilon=0.718810 Action_times=3341181 Epoche=1878\n",
      "Epsilon=0.718758 Action_times=3341915 Epoche=1879\n",
      "Epsilon=0.718706 Action_times=3342636 Epoche=1880\n",
      "Epsilon=0.718627 Action_times=3343750 Epoche=1881\n",
      "Epsilon=0.718496 Action_times=3345607 Epoche=1882\n",
      "Epsilon=0.718402 Action_times=3346928 Epoche=1883\n",
      "Epsilon=0.718322 Action_times=3348068 Epoche=1884\n",
      "Epsilon=0.718265 Action_times=3348870 Epoche=1885\n",
      "Epsilon=0.718121 Action_times=3350897 Epoche=1886\n",
      "Epsilon=0.718017 Action_times=3352371 Epoche=1887\n",
      "Epsilon=0.717897 Action_times=3354064 Epoche=1888\n",
      "Epsilon=0.717851 Action_times=3354709 Epoche=1889\n",
      "Epsilon=0.717793 Action_times=3355529 Epoche=1890\n",
      "Epsilon=0.717742 Action_times=3356254 Epoche=1891\n",
      "Epsilon=0.717679 Action_times=3357146 Epoche=1892\n",
      "Epsilon=0.717667 Action_times=3357318 Epoche=1893\n",
      "Epsilon=0.717566 Action_times=3358747 Epoche=1894\n",
      "Epsilon=0.717500 Action_times=3359675 Epoche=1895\n",
      "Epsilon=0.717376 Action_times=3361425 Epoche=1896\n",
      "Epsilon=0.717192 Action_times=3364027 Epoche=1897\n",
      "Epsilon=0.717043 Action_times=3366133 Epoche=1898\n",
      "Epsilon=0.716981 Action_times=3367017 Epoche=1899\n",
      "Epsilon=0.716923 Action_times=3367834 Epoche=1900\n",
      "Epsilon=0.716811 Action_times=3369413 Epoche=1901\n",
      "Epsilon=0.716694 Action_times=3371074 Epoche=1902\n",
      "Epsilon=0.716674 Action_times=3371351 Epoche=1903\n",
      "Epsilon=0.716551 Action_times=3373096 Epoche=1904\n",
      "Epsilon=0.716498 Action_times=3373845 Epoche=1905\n",
      "Epsilon=0.716368 Action_times=3375681 Epoche=1906\n",
      "Epsilon=0.716295 Action_times=3376714 Epoche=1907\n",
      "Epsilon=0.716201 Action_times=3378049 Epoche=1908\n",
      "Epsilon=0.716116 Action_times=3379257 Epoche=1909\n",
      "Epsilon=0.716042 Action_times=3380296 Epoche=1910\n",
      "Epsilon=0.715976 Action_times=3381242 Epoche=1911\n",
      "Epsilon=0.715837 Action_times=3383207 Epoche=1912\n",
      "Epsilon=0.715734 Action_times=3384665 Epoche=1913\n",
      "Epsilon=0.715574 Action_times=3386937 Epoche=1914\n",
      "Epsilon=0.715444 Action_times=3388773 Epoche=1915\n",
      "Epsilon=0.715313 Action_times=3390635 Epoche=1916\n",
      "Epsilon=0.715200 Action_times=3392235 Epoche=1917\n",
      "Epsilon=0.715170 Action_times=3392660 Epoche=1918\n",
      "Epsilon=0.715104 Action_times=3393603 Epoche=1919\n",
      "Epsilon=0.715037 Action_times=3394540 Epoche=1920\n",
      "Epsilon=0.714985 Action_times=3395279 Epoche=1921\n",
      "Epsilon=0.714959 Action_times=3395655 Epoche=1922\n",
      "Epsilon=0.714880 Action_times=3396775 Epoche=1923\n",
      "Epsilon=0.714794 Action_times=3397989 Epoche=1924\n",
      "Epsilon=0.714718 Action_times=3399078 Epoche=1925\n",
      "Epsilon=0.714665 Action_times=3399826 Epoche=1926\n",
      "Epsilon=0.714623 Action_times=3400427 Epoche=1927\n",
      "Epsilon=0.714597 Action_times=3400792 Epoche=1928\n",
      "Epsilon=0.714566 Action_times=3401228 Epoche=1929\n",
      "Epsilon=0.714543 Action_times=3401560 Epoche=1930\n",
      "Epsilon=0.714490 Action_times=3402303 Epoche=1931\n",
      "Epsilon=0.714406 Action_times=3403497 Epoche=1932\n",
      "Epsilon=0.714286 Action_times=3405202 Epoche=1933\n",
      "Epsilon=0.714220 Action_times=3406140 Epoche=1934\n",
      "Epsilon=0.714157 Action_times=3407040 Epoche=1935\n",
      "Epsilon=0.714051 Action_times=3408538 Epoche=1936\n",
      "Epsilon=0.713944 Action_times=3410064 Epoche=1937\n",
      "Epsilon=0.713814 Action_times=3411906 Epoche=1938\n",
      "Epsilon=0.713761 Action_times=3412663 Epoche=1939\n",
      "Epsilon=0.713722 Action_times=3413222 Epoche=1940\n",
      "Epsilon=0.713665 Action_times=3414028 Epoche=1941\n",
      "Epsilon=0.713625 Action_times=3414591 Epoche=1942\n",
      "Epsilon=0.713529 Action_times=3415954 Epoche=1943\n",
      "Epsilon=0.713453 Action_times=3417045 Epoche=1944\n",
      "Epsilon=0.713419 Action_times=3417528 Epoche=1945\n",
      "Epsilon=0.713377 Action_times=3418113 Epoche=1946\n",
      "Epsilon=0.713278 Action_times=3419531 Epoche=1947\n",
      "Epsilon=0.713196 Action_times=3420686 Epoche=1948\n",
      "Epsilon=0.713196 Action_times=3420699 Epoche=1949\n",
      "Epsilon=0.712997 Action_times=3423521 Epoche=1950\n",
      "Epsilon=0.712924 Action_times=3424566 Epoche=1951\n",
      "Epsilon=0.712847 Action_times=3425661 Epoche=1952\n",
      "Epsilon=0.712774 Action_times=3426697 Epoche=1953\n",
      "Epsilon=0.712687 Action_times=3427938 Epoche=1954\n",
      "Epsilon=0.712661 Action_times=3428300 Epoche=1955\n",
      "Epsilon=0.712576 Action_times=3429510 Epoche=1956\n",
      "Epsilon=0.712542 Action_times=3429996 Epoche=1957\n",
      "Epsilon=0.712514 Action_times=3430400 Epoche=1958\n",
      "Epsilon=0.712467 Action_times=3431071 Epoche=1959\n",
      "Epsilon=0.712390 Action_times=3432166 Epoche=1960\n",
      "Epsilon=0.712194 Action_times=3434951 Epoche=1961\n",
      "Epsilon=0.712110 Action_times=3436152 Epoche=1962\n",
      "Epsilon=0.712021 Action_times=3437413 Epoche=1963\n",
      "Epsilon=0.711904 Action_times=3439084 Epoche=1964\n",
      "Epsilon=0.711854 Action_times=3439802 Epoche=1965\n",
      "Epsilon=0.711823 Action_times=3440241 Epoche=1966\n",
      "Epsilon=0.711774 Action_times=3440939 Epoche=1967\n",
      "Epsilon=0.711737 Action_times=3441463 Epoche=1968\n",
      "Epsilon=0.711665 Action_times=3442486 Epoche=1969\n",
      "Epsilon=0.711571 Action_times=3443829 Epoche=1970\n",
      "Epsilon=0.711468 Action_times=3445300 Epoche=1971\n",
      "Epsilon=0.711400 Action_times=3446271 Epoche=1972\n",
      "Epsilon=0.711348 Action_times=3447012 Epoche=1973\n",
      "Epsilon=0.711326 Action_times=3447324 Epoche=1974\n",
      "Epsilon=0.711242 Action_times=3448515 Epoche=1975\n",
      "Epsilon=0.711214 Action_times=3448916 Epoche=1976\n",
      "Epsilon=0.711139 Action_times=3449988 Epoche=1977\n",
      "Epsilon=0.711112 Action_times=3450376 Epoche=1978\n",
      "Epsilon=0.711073 Action_times=3450931 Epoche=1979\n",
      "Epsilon=0.710928 Action_times=3452997 Epoche=1980\n",
      "Epsilon=0.710777 Action_times=3455154 Epoche=1981\n",
      "Epsilon=0.710644 Action_times=3457049 Epoche=1982\n",
      "Epsilon=0.710579 Action_times=3457976 Epoche=1983\n",
      "Epsilon=0.710453 Action_times=3459781 Epoche=1984\n",
      "Epsilon=0.710349 Action_times=3461265 Epoche=1985\n",
      "Epsilon=0.710229 Action_times=3462979 Epoche=1986\n",
      "Epsilon=0.710183 Action_times=3463638 Epoche=1987\n",
      "Epsilon=0.710148 Action_times=3464138 Epoche=1988\n",
      "Epsilon=0.710061 Action_times=3465369 Epoche=1989\n",
      "Epsilon=0.709998 Action_times=3466280 Epoche=1990\n",
      "Epsilon=0.709786 Action_times=3469298 Epoche=1991\n",
      "Epsilon=0.709756 Action_times=3469727 Epoche=1992\n",
      "Epsilon=0.709696 Action_times=3470588 Epoche=1993\n",
      "Epsilon=0.709567 Action_times=3472433 Epoche=1994\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.709466 Action_times=3473874 Epoche=1995\n",
      "Epsilon=0.709361 Action_times=3475383 Epoche=1996\n",
      "Epsilon=0.709148 Action_times=3478426 Epoche=1997\n",
      "Epsilon=0.709028 Action_times=3480144 Epoche=1998\n",
      "Epsilon=0.708968 Action_times=3480999 Epoche=1999\n",
      "Epsilon=0.708787 Action_times=3483594 Epoche=2000\n",
      "Epsilon=0.708670 Action_times=3485264 Epoche=2001\n",
      "Epsilon=0.708549 Action_times=3486990 Epoche=2002\n",
      "Epsilon=0.708457 Action_times=3488317 Epoche=2003\n",
      "Epsilon=0.708384 Action_times=3489360 Epoche=2004\n",
      "Epsilon=0.708328 Action_times=3490165 Epoche=2005\n",
      "Epsilon=0.708287 Action_times=3490754 Epoche=2006\n",
      "Epsilon=0.708215 Action_times=3491784 Epoche=2007\n",
      "Epsilon=0.708129 Action_times=3493006 Epoche=2008\n",
      "Epsilon=0.708048 Action_times=3494165 Epoche=2009\n",
      "Epsilon=0.707993 Action_times=3494954 Epoche=2010\n",
      "Epsilon=0.707909 Action_times=3496169 Epoche=2011\n",
      "Epsilon=0.707833 Action_times=3497253 Epoche=2012\n",
      "Epsilon=0.707745 Action_times=3498509 Epoche=2013\n",
      "Epsilon=0.707735 Action_times=3498662 Epoche=2014\n",
      "Epsilon=0.707703 Action_times=3499120 Epoche=2015\n",
      "Epsilon=0.707610 Action_times=3500445 Epoche=2016\n",
      "Epsilon=0.707542 Action_times=3501422 Epoche=2017\n",
      "Epsilon=0.707473 Action_times=3502417 Epoche=2018\n",
      "Epsilon=0.707355 Action_times=3504107 Epoche=2019\n",
      "Epsilon=0.707292 Action_times=3505010 Epoche=2020\n",
      "Epsilon=0.707282 Action_times=3505150 Epoche=2021\n",
      "Epsilon=0.707234 Action_times=3505845 Epoche=2022\n",
      "Epsilon=0.707204 Action_times=3506270 Epoche=2023\n",
      "Epsilon=0.707183 Action_times=3506567 Epoche=2024\n",
      "Epsilon=0.707093 Action_times=3507861 Epoche=2025\n",
      "Epsilon=0.707060 Action_times=3508333 Epoche=2026\n",
      "Epsilon=0.706995 Action_times=3509268 Epoche=2027\n",
      "Epsilon=0.706924 Action_times=3510284 Epoche=2028\n",
      "Epsilon=0.706788 Action_times=3512238 Epoche=2029\n",
      "Epsilon=0.706719 Action_times=3513233 Epoche=2030\n",
      "Epsilon=0.706656 Action_times=3514136 Epoche=2031\n",
      "Epsilon=0.706519 Action_times=3516100 Epoche=2032\n",
      "Epsilon=0.706371 Action_times=3518222 Epoche=2033\n",
      "Epsilon=0.706360 Action_times=3518383 Epoche=2034\n",
      "Epsilon=0.706267 Action_times=3519724 Epoche=2035\n",
      "Epsilon=0.706050 Action_times=3522828 Epoche=2036\n",
      "Epsilon=0.705936 Action_times=3524471 Epoche=2037\n",
      "Epsilon=0.705910 Action_times=3524849 Epoche=2038\n",
      "Epsilon=0.705846 Action_times=3525761 Epoche=2039\n",
      "Epsilon=0.705722 Action_times=3527552 Epoche=2040\n",
      "Epsilon=0.705405 Action_times=3532108 Epoche=2041\n",
      "Epsilon=0.705347 Action_times=3532933 Epoche=2042\n",
      "Epsilon=0.705321 Action_times=3533311 Epoche=2043\n",
      "Epsilon=0.705279 Action_times=3533920 Epoche=2044\n",
      "Epsilon=0.705211 Action_times=3534900 Epoche=2045\n",
      "Epsilon=0.705066 Action_times=3536987 Epoche=2046\n",
      "Epsilon=0.705008 Action_times=3537813 Epoche=2047\n",
      "Epsilon=0.704947 Action_times=3538689 Epoche=2048\n",
      "Epsilon=0.704921 Action_times=3539065 Epoche=2049\n",
      "Epsilon=0.704884 Action_times=3539598 Epoche=2050\n",
      "Epsilon=0.704817 Action_times=3540571 Epoche=2051\n",
      "Epsilon=0.704742 Action_times=3541641 Epoche=2052\n",
      "Epsilon=0.704589 Action_times=3543852 Epoche=2053\n",
      "Epsilon=0.704472 Action_times=3545535 Epoche=2054\n",
      "Epsilon=0.704363 Action_times=3547099 Epoche=2055\n",
      "Epsilon=0.704326 Action_times=3547635 Epoche=2056\n",
      "Epsilon=0.704311 Action_times=3547854 Epoche=2057\n",
      "Epsilon=0.704234 Action_times=3548960 Epoche=2058\n",
      "Epsilon=0.704163 Action_times=3549980 Epoche=2059\n",
      "Epsilon=0.704117 Action_times=3550639 Epoche=2060\n",
      "Epsilon=0.704024 Action_times=3551981 Epoche=2061\n",
      "Epsilon=0.703995 Action_times=3552400 Epoche=2062\n",
      "Epsilon=0.703976 Action_times=3552673 Epoche=2063\n",
      "Epsilon=0.703957 Action_times=3552943 Epoche=2064\n",
      "Epsilon=0.703899 Action_times=3553786 Epoche=2065\n",
      "Epsilon=0.703774 Action_times=3555586 Epoche=2066\n",
      "Epsilon=0.703713 Action_times=3556468 Epoche=2067\n",
      "Epsilon=0.703664 Action_times=3557173 Epoche=2068\n",
      "Epsilon=0.703607 Action_times=3557992 Epoche=2069\n",
      "Epsilon=0.703593 Action_times=3558201 Epoche=2070\n",
      "Epsilon=0.703514 Action_times=3559328 Epoche=2071\n",
      "Epsilon=0.703353 Action_times=3561658 Epoche=2072\n",
      "Epsilon=0.703263 Action_times=3562961 Epoche=2073\n",
      "Epsilon=0.703207 Action_times=3563756 Epoche=2074\n",
      "Epsilon=0.703082 Action_times=3565561 Epoche=2075\n",
      "Epsilon=0.702986 Action_times=3566946 Epoche=2076\n",
      "Epsilon=0.702959 Action_times=3567335 Epoche=2077\n",
      "Epsilon=0.702915 Action_times=3567982 Epoche=2078\n",
      "Epsilon=0.702830 Action_times=3569196 Epoche=2079\n",
      "Epsilon=0.702808 Action_times=3569515 Epoche=2080\n",
      "Epsilon=0.702659 Action_times=3571670 Epoche=2081\n",
      "Epsilon=0.702585 Action_times=3572741 Epoche=2082\n",
      "Epsilon=0.702513 Action_times=3573777 Epoche=2083\n",
      "Epsilon=0.702507 Action_times=3573869 Epoche=2084\n",
      "Epsilon=0.702428 Action_times=3575000 Epoche=2085\n",
      "Epsilon=0.702307 Action_times=3576756 Epoche=2086\n",
      "Epsilon=0.702146 Action_times=3579077 Epoche=2087\n",
      "Epsilon=0.702123 Action_times=3579408 Epoche=2088\n",
      "Epsilon=0.702074 Action_times=3580114 Epoche=2089\n",
      "Epsilon=0.701991 Action_times=3581315 Epoche=2090\n",
      "Epsilon=0.701947 Action_times=3581955 Epoche=2091\n",
      "Epsilon=0.701922 Action_times=3582324 Epoche=2092\n",
      "Epsilon=0.701844 Action_times=3583442 Epoche=2093\n",
      "Epsilon=0.701798 Action_times=3584107 Epoche=2094\n",
      "Epsilon=0.701646 Action_times=3586311 Epoche=2095\n",
      "Epsilon=0.701571 Action_times=3587392 Epoche=2096\n",
      "Epsilon=0.701478 Action_times=3588740 Epoche=2097\n",
      "Epsilon=0.701386 Action_times=3590069 Epoche=2098\n",
      "Epsilon=0.701102 Action_times=3594170 Epoche=2099\n",
      "Epsilon=0.701036 Action_times=3595125 Epoche=2100\n",
      "Epsilon=0.700935 Action_times=3596599 Epoche=2101\n",
      "Epsilon=0.700870 Action_times=3597536 Epoche=2102\n",
      "Epsilon=0.700752 Action_times=3599244 Epoche=2103\n",
      "Epsilon=0.700656 Action_times=3600624 Epoche=2104\n",
      "Epsilon=0.700592 Action_times=3601562 Epoche=2105\n",
      "Epsilon=0.700490 Action_times=3603041 Epoche=2106\n",
      "Epsilon=0.700449 Action_times=3603623 Epoche=2107\n",
      "Epsilon=0.700334 Action_times=3605289 Epoche=2108\n",
      "Epsilon=0.700249 Action_times=3606520 Epoche=2109\n",
      "Epsilon=0.700226 Action_times=3606859 Epoche=2110\n",
      "Epsilon=0.700207 Action_times=3607134 Epoche=2111\n",
      "Epsilon=0.700173 Action_times=3607632 Epoche=2112\n",
      "Epsilon=0.700154 Action_times=3607903 Epoche=2113\n",
      "Epsilon=0.700129 Action_times=3608267 Epoche=2114\n",
      "Epsilon=0.700065 Action_times=3609194 Epoche=2115\n",
      "Epsilon=0.700035 Action_times=3609621 Epoche=2116\n",
      "Epsilon=0.699957 Action_times=3610751 Epoche=2117\n",
      "Epsilon=0.699856 Action_times=3612223 Epoche=2118\n",
      "Epsilon=0.699766 Action_times=3613525 Epoche=2119\n",
      "Epsilon=0.699695 Action_times=3614551 Epoche=2120\n",
      "Epsilon=0.699583 Action_times=3616172 Epoche=2121\n",
      "Epsilon=0.699540 Action_times=3616807 Epoche=2122\n",
      "Epsilon=0.699440 Action_times=3618246 Epoche=2123\n",
      "Epsilon=0.699390 Action_times=3618985 Epoche=2124\n",
      "Epsilon=0.699336 Action_times=3619761 Epoche=2125\n",
      "Epsilon=0.699268 Action_times=3620752 Epoche=2126\n",
      "Epsilon=0.699177 Action_times=3622065 Epoche=2127\n",
      "Epsilon=0.699117 Action_times=3622937 Epoche=2128\n",
      "Epsilon=0.699040 Action_times=3624060 Epoche=2129\n",
      "Epsilon=0.698967 Action_times=3625115 Epoche=2130\n",
      "Epsilon=0.698916 Action_times=3625850 Epoche=2131\n",
      "Epsilon=0.698862 Action_times=3626633 Epoche=2132\n",
      "Epsilon=0.698704 Action_times=3628930 Epoche=2133\n",
      "Epsilon=0.698633 Action_times=3629967 Epoche=2134\n",
      "Epsilon=0.698596 Action_times=3630502 Epoche=2135\n",
      "Epsilon=0.698579 Action_times=3630746 Epoche=2136\n",
      "Epsilon=0.698570 Action_times=3630884 Epoche=2137\n",
      "Epsilon=0.698524 Action_times=3631550 Epoche=2138\n",
      "Epsilon=0.698469 Action_times=3632341 Epoche=2139\n",
      "Epsilon=0.698333 Action_times=3634320 Epoche=2140\n",
      "Epsilon=0.698310 Action_times=3634649 Epoche=2141\n",
      "Epsilon=0.698275 Action_times=3635172 Epoche=2142\n",
      "Epsilon=0.698154 Action_times=3636926 Epoche=2143\n",
      "Epsilon=0.698045 Action_times=3638502 Epoche=2144\n",
      "Epsilon=0.697915 Action_times=3640400 Epoche=2145\n",
      "Epsilon=0.697828 Action_times=3641667 Epoche=2146\n",
      "Epsilon=0.697761 Action_times=3642630 Epoche=2147\n",
      "Epsilon=0.697714 Action_times=3643322 Epoche=2148\n",
      "Epsilon=0.697680 Action_times=3643817 Epoche=2149\n",
      "Epsilon=0.697597 Action_times=3645017 Epoche=2150\n",
      "Epsilon=0.697552 Action_times=3645681 Epoche=2151\n",
      "Epsilon=0.697438 Action_times=3647334 Epoche=2152\n",
      "Epsilon=0.697324 Action_times=3648991 Epoche=2153\n",
      "Epsilon=0.697194 Action_times=3650885 Epoche=2154\n",
      "Epsilon=0.697144 Action_times=3651614 Epoche=2155\n",
      "Epsilon=0.697092 Action_times=3652367 Epoche=2156\n",
      "Epsilon=0.697026 Action_times=3653334 Epoche=2157\n",
      "Epsilon=0.696942 Action_times=3654558 Epoche=2158\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.696874 Action_times=3655547 Epoche=2159\n",
      "Epsilon=0.696743 Action_times=3657442 Epoche=2160\n",
      "Epsilon=0.696631 Action_times=3659073 Epoche=2161\n",
      "Epsilon=0.696528 Action_times=3660578 Epoche=2162\n",
      "Epsilon=0.696446 Action_times=3661767 Epoche=2163\n",
      "Epsilon=0.696339 Action_times=3663328 Epoche=2164\n",
      "Epsilon=0.696201 Action_times=3665349 Epoche=2165\n",
      "Epsilon=0.696089 Action_times=3666972 Epoche=2166\n",
      "Epsilon=0.696018 Action_times=3668010 Epoche=2167\n",
      "Epsilon=0.695953 Action_times=3668961 Epoche=2168\n",
      "Epsilon=0.695934 Action_times=3669236 Epoche=2169\n",
      "Epsilon=0.695893 Action_times=3669828 Epoche=2170\n",
      "Epsilon=0.695802 Action_times=3671159 Epoche=2171\n",
      "Epsilon=0.695776 Action_times=3671542 Epoche=2172\n",
      "Epsilon=0.695717 Action_times=3672397 Epoche=2173\n",
      "Epsilon=0.695690 Action_times=3672795 Epoche=2174\n",
      "Epsilon=0.695651 Action_times=3673359 Epoche=2175\n",
      "Epsilon=0.695621 Action_times=3673796 Epoche=2176\n",
      "Epsilon=0.695451 Action_times=3676274 Epoche=2177\n",
      "Epsilon=0.695400 Action_times=3677022 Epoche=2178\n",
      "Epsilon=0.695279 Action_times=3678788 Epoche=2179\n",
      "Epsilon=0.695196 Action_times=3679996 Epoche=2180\n",
      "Epsilon=0.695053 Action_times=3682093 Epoche=2181\n",
      "Epsilon=0.695032 Action_times=3682393 Epoche=2182\n",
      "Epsilon=0.694925 Action_times=3683950 Epoche=2183\n",
      "Epsilon=0.694868 Action_times=3684792 Epoche=2184\n",
      "Epsilon=0.694800 Action_times=3685786 Epoche=2185\n",
      "Epsilon=0.694656 Action_times=3687886 Epoche=2186\n",
      "Epsilon=0.694597 Action_times=3688739 Epoche=2187\n",
      "Epsilon=0.694478 Action_times=3690490 Epoche=2188\n",
      "Epsilon=0.694391 Action_times=3691751 Epoche=2189\n",
      "Epsilon=0.694359 Action_times=3692224 Epoche=2190\n",
      "Epsilon=0.694305 Action_times=3693008 Epoche=2191\n",
      "Epsilon=0.694228 Action_times=3694133 Epoche=2192\n",
      "Epsilon=0.694206 Action_times=3694452 Epoche=2193\n",
      "Epsilon=0.694161 Action_times=3695123 Epoche=2194\n",
      "Epsilon=0.694048 Action_times=3696768 Epoche=2195\n",
      "Epsilon=0.693979 Action_times=3697780 Epoche=2196\n",
      "Epsilon=0.693946 Action_times=3698253 Epoche=2197\n",
      "Epsilon=0.693912 Action_times=3698764 Epoche=2198\n",
      "Epsilon=0.693850 Action_times=3699666 Epoche=2199\n",
      "Epsilon=0.693766 Action_times=3700889 Epoche=2200\n",
      "Epsilon=0.693701 Action_times=3701843 Epoche=2201\n",
      "Epsilon=0.693623 Action_times=3702978 Epoche=2202\n",
      "Epsilon=0.693540 Action_times=3704200 Epoche=2203\n",
      "Epsilon=0.693438 Action_times=3705685 Epoche=2204\n",
      "Epsilon=0.693344 Action_times=3707061 Epoche=2205\n",
      "Epsilon=0.693268 Action_times=3708175 Epoche=2206\n",
      "Epsilon=0.693214 Action_times=3708966 Epoche=2207\n",
      "Epsilon=0.693086 Action_times=3710837 Epoche=2208\n",
      "Epsilon=0.692931 Action_times=3713109 Epoche=2209\n",
      "Epsilon=0.692853 Action_times=3714252 Epoche=2210\n",
      "Epsilon=0.692647 Action_times=3717264 Epoche=2211\n",
      "Epsilon=0.692566 Action_times=3718452 Epoche=2212\n",
      "Epsilon=0.692479 Action_times=3719727 Epoche=2213\n",
      "Epsilon=0.692411 Action_times=3720730 Epoche=2214\n",
      "Epsilon=0.692346 Action_times=3721681 Epoche=2215\n",
      "Epsilon=0.692204 Action_times=3723762 Epoche=2216\n",
      "Epsilon=0.692136 Action_times=3724756 Epoche=2217\n",
      "Epsilon=0.692085 Action_times=3725510 Epoche=2218\n",
      "Epsilon=0.692030 Action_times=3726313 Epoche=2219\n",
      "Epsilon=0.691940 Action_times=3727633 Epoche=2220\n",
      "Epsilon=0.691917 Action_times=3727972 Epoche=2221\n",
      "Epsilon=0.691872 Action_times=3728637 Epoche=2222\n",
      "Epsilon=0.691805 Action_times=3729618 Epoche=2223\n",
      "Epsilon=0.691727 Action_times=3730754 Epoche=2224\n",
      "Epsilon=0.691701 Action_times=3731145 Epoche=2225\n",
      "Epsilon=0.691623 Action_times=3732281 Epoche=2226\n",
      "Epsilon=0.691590 Action_times=3732762 Epoche=2227\n",
      "Epsilon=0.691537 Action_times=3733542 Epoche=2228\n",
      "Epsilon=0.691465 Action_times=3734597 Epoche=2229\n",
      "Epsilon=0.691408 Action_times=3735437 Epoche=2230\n",
      "Epsilon=0.691352 Action_times=3736255 Epoche=2231\n",
      "Epsilon=0.691292 Action_times=3737144 Epoche=2232\n",
      "Epsilon=0.691208 Action_times=3738369 Epoche=2233\n",
      "Epsilon=0.691137 Action_times=3739417 Epoche=2234\n",
      "Epsilon=0.691043 Action_times=3740799 Epoche=2235\n",
      "Epsilon=0.690990 Action_times=3741571 Epoche=2236\n",
      "Epsilon=0.690880 Action_times=3743189 Epoche=2237\n",
      "Epsilon=0.690809 Action_times=3744231 Epoche=2238\n",
      "Epsilon=0.690764 Action_times=3744889 Epoche=2239\n",
      "Epsilon=0.690698 Action_times=3745857 Epoche=2240\n",
      "Epsilon=0.690642 Action_times=3746685 Epoche=2241\n",
      "Epsilon=0.690557 Action_times=3747935 Epoche=2242\n",
      "Epsilon=0.690520 Action_times=3748476 Epoche=2243\n",
      "Epsilon=0.690505 Action_times=3748693 Epoche=2244\n",
      "Epsilon=0.690459 Action_times=3749372 Epoche=2245\n",
      "Epsilon=0.690429 Action_times=3749818 Epoche=2246\n",
      "Epsilon=0.690325 Action_times=3751337 Epoche=2247\n",
      "Epsilon=0.690229 Action_times=3752752 Epoche=2248\n",
      "Epsilon=0.690098 Action_times=3754681 Epoche=2249\n",
      "Epsilon=0.690079 Action_times=3754961 Epoche=2250\n",
      "Epsilon=0.689997 Action_times=3756160 Epoche=2251\n",
      "Epsilon=0.689975 Action_times=3756487 Epoche=2252\n",
      "Epsilon=0.689858 Action_times=3758215 Epoche=2253\n",
      "Epsilon=0.689857 Action_times=3758229 Epoche=2254\n",
      "Epsilon=0.689807 Action_times=3758955 Epoche=2255\n",
      "Epsilon=0.689678 Action_times=3760864 Epoche=2256\n",
      "Epsilon=0.689595 Action_times=3762080 Epoche=2257\n",
      "Epsilon=0.689519 Action_times=3763196 Epoche=2258\n",
      "Epsilon=0.689431 Action_times=3764494 Epoche=2259\n",
      "Epsilon=0.689378 Action_times=3765270 Epoche=2260\n",
      "Epsilon=0.689324 Action_times=3766062 Epoche=2261\n",
      "Epsilon=0.689285 Action_times=3766636 Epoche=2262\n",
      "Epsilon=0.689225 Action_times=3767528 Epoche=2263\n",
      "Epsilon=0.689129 Action_times=3768944 Epoche=2264\n",
      "Epsilon=0.689090 Action_times=3769512 Epoche=2265\n",
      "Epsilon=0.689043 Action_times=3770208 Epoche=2266\n",
      "Epsilon=0.688975 Action_times=3771211 Epoche=2267\n",
      "Epsilon=0.688949 Action_times=3771586 Epoche=2268\n",
      "Epsilon=0.688912 Action_times=3772139 Epoche=2269\n",
      "Epsilon=0.688831 Action_times=3773326 Epoche=2270\n",
      "Epsilon=0.688796 Action_times=3773838 Epoche=2271\n",
      "Epsilon=0.688780 Action_times=3774072 Epoche=2272\n",
      "Epsilon=0.688756 Action_times=3774439 Epoche=2273\n",
      "Epsilon=0.688720 Action_times=3774961 Epoche=2274\n",
      "Epsilon=0.688665 Action_times=3775778 Epoche=2275\n",
      "Epsilon=0.688582 Action_times=3776999 Epoche=2276\n",
      "Epsilon=0.688565 Action_times=3777250 Epoche=2277\n",
      "Epsilon=0.688503 Action_times=3778159 Epoche=2278\n",
      "Epsilon=0.688461 Action_times=3778774 Epoche=2279\n",
      "Epsilon=0.688458 Action_times=3778822 Epoche=2280\n",
      "Epsilon=0.688434 Action_times=3779171 Epoche=2281\n",
      "Epsilon=0.688386 Action_times=3779880 Epoche=2282\n",
      "Epsilon=0.688374 Action_times=3780064 Epoche=2283\n",
      "Epsilon=0.688336 Action_times=3780616 Epoche=2284\n",
      "Epsilon=0.688267 Action_times=3781643 Epoche=2285\n",
      "Epsilon=0.688159 Action_times=3783232 Epoche=2286\n",
      "Epsilon=0.688085 Action_times=3784320 Epoche=2287\n",
      "Epsilon=0.687897 Action_times=3787092 Epoche=2288\n",
      "Epsilon=0.687648 Action_times=3790767 Epoche=2289\n",
      "Epsilon=0.687496 Action_times=3793008 Epoche=2290\n",
      "Epsilon=0.687321 Action_times=3795593 Epoche=2291\n",
      "Epsilon=0.687279 Action_times=3796220 Epoche=2292\n",
      "Epsilon=0.687262 Action_times=3796474 Epoche=2293\n",
      "Epsilon=0.687147 Action_times=3798170 Epoche=2294\n",
      "Epsilon=0.687095 Action_times=3798930 Epoche=2295\n",
      "Epsilon=0.686971 Action_times=3800766 Epoche=2296\n",
      "Epsilon=0.686924 Action_times=3801463 Epoche=2297\n",
      "Epsilon=0.686794 Action_times=3803381 Epoche=2298\n",
      "Epsilon=0.686764 Action_times=3803824 Epoche=2299\n",
      "Epsilon=0.686732 Action_times=3804299 Epoche=2300\n",
      "Epsilon=0.686665 Action_times=3805283 Epoche=2301\n",
      "Epsilon=0.686647 Action_times=3805548 Epoche=2302\n",
      "Epsilon=0.686583 Action_times=3806505 Epoche=2303\n",
      "Epsilon=0.686525 Action_times=3807357 Epoche=2304\n",
      "Epsilon=0.686464 Action_times=3808261 Epoche=2305\n",
      "Epsilon=0.686400 Action_times=3809209 Epoche=2306\n",
      "Epsilon=0.686292 Action_times=3810804 Epoche=2307\n",
      "Epsilon=0.686284 Action_times=3810917 Epoche=2308\n",
      "Epsilon=0.686136 Action_times=3813107 Epoche=2309\n",
      "Epsilon=0.686054 Action_times=3814313 Epoche=2310\n",
      "Epsilon=0.685910 Action_times=3816451 Epoche=2311\n",
      "Epsilon=0.685805 Action_times=3818001 Epoche=2312\n",
      "Epsilon=0.685720 Action_times=3819265 Epoche=2313\n",
      "Epsilon=0.685623 Action_times=3820690 Epoche=2314\n",
      "Epsilon=0.685600 Action_times=3821031 Epoche=2315\n",
      "Epsilon=0.685542 Action_times=3821900 Epoche=2316\n",
      "Epsilon=0.685449 Action_times=3823273 Epoche=2317\n",
      "Epsilon=0.685371 Action_times=3824433 Epoche=2318\n",
      "Epsilon=0.685267 Action_times=3825962 Epoche=2319\n",
      "Epsilon=0.685205 Action_times=3826887 Epoche=2320\n",
      "Epsilon=0.685072 Action_times=3828853 Epoche=2321\n",
      "Epsilon=0.685053 Action_times=3829133 Epoche=2322\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.685028 Action_times=3829510 Epoche=2323\n",
      "Epsilon=0.684996 Action_times=3829987 Epoche=2324\n",
      "Epsilon=0.684935 Action_times=3830880 Epoche=2325\n",
      "Epsilon=0.684896 Action_times=3831468 Epoche=2326\n",
      "Epsilon=0.684781 Action_times=3833170 Epoche=2327\n",
      "Epsilon=0.684701 Action_times=3834346 Epoche=2328\n",
      "Epsilon=0.684615 Action_times=3835631 Epoche=2329\n",
      "Epsilon=0.684558 Action_times=3836467 Epoche=2330\n",
      "Epsilon=0.684282 Action_times=3840568 Epoche=2331\n",
      "Epsilon=0.684153 Action_times=3842472 Epoche=2332\n",
      "Epsilon=0.684083 Action_times=3843524 Epoche=2333\n",
      "Epsilon=0.684049 Action_times=3844026 Epoche=2334\n",
      "Epsilon=0.683992 Action_times=3844864 Epoche=2335\n",
      "Epsilon=0.683874 Action_times=3846621 Epoche=2336\n",
      "Epsilon=0.683832 Action_times=3847242 Epoche=2337\n",
      "Epsilon=0.683717 Action_times=3848943 Epoche=2338\n",
      "Epsilon=0.683610 Action_times=3850533 Epoche=2339\n",
      "Epsilon=0.683531 Action_times=3851716 Epoche=2340\n",
      "Epsilon=0.683399 Action_times=3853663 Epoche=2341\n",
      "Epsilon=0.683126 Action_times=3857717 Epoche=2342\n",
      "Epsilon=0.683116 Action_times=3857868 Epoche=2343\n",
      "Epsilon=0.683094 Action_times=3858199 Epoche=2344\n",
      "Epsilon=0.683042 Action_times=3858965 Epoche=2345\n",
      "Epsilon=0.682941 Action_times=3860467 Epoche=2346\n",
      "Epsilon=0.682927 Action_times=3860682 Epoche=2347\n",
      "Epsilon=0.682817 Action_times=3862309 Epoche=2348\n",
      "Epsilon=0.682652 Action_times=3864762 Epoche=2349\n",
      "Epsilon=0.682431 Action_times=3868054 Epoche=2350\n",
      "Epsilon=0.682320 Action_times=3869708 Epoche=2351\n",
      "Epsilon=0.682293 Action_times=3870104 Epoche=2352\n",
      "Epsilon=0.682248 Action_times=3870783 Epoche=2353\n",
      "Epsilon=0.682187 Action_times=3871679 Epoche=2354\n",
      "Epsilon=0.682060 Action_times=3873574 Epoche=2355\n",
      "Epsilon=0.681949 Action_times=3875222 Epoche=2356\n",
      "Epsilon=0.681823 Action_times=3877099 Epoche=2357\n",
      "Epsilon=0.681763 Action_times=3877988 Epoche=2358\n",
      "Epsilon=0.681600 Action_times=3880425 Epoche=2359\n",
      "Epsilon=0.681444 Action_times=3882742 Epoche=2360\n",
      "Epsilon=0.681352 Action_times=3884114 Epoche=2361\n",
      "Epsilon=0.681232 Action_times=3885903 Epoche=2362\n",
      "Epsilon=0.681173 Action_times=3886784 Epoche=2363\n",
      "Epsilon=0.680978 Action_times=3889687 Epoche=2364\n",
      "Epsilon=0.680835 Action_times=3891810 Epoche=2365\n",
      "Epsilon=0.680711 Action_times=3893663 Epoche=2366\n",
      "Epsilon=0.680645 Action_times=3894650 Epoche=2367\n",
      "Epsilon=0.680497 Action_times=3896856 Epoche=2368\n",
      "Epsilon=0.680460 Action_times=3897412 Epoche=2369\n",
      "Epsilon=0.680400 Action_times=3898308 Epoche=2370\n",
      "Epsilon=0.680312 Action_times=3899612 Epoche=2371\n",
      "Epsilon=0.680278 Action_times=3900119 Epoche=2372\n",
      "Epsilon=0.680213 Action_times=3901094 Epoche=2373\n",
      "Epsilon=0.680109 Action_times=3902641 Epoche=2374\n",
      "Epsilon=0.680017 Action_times=3904013 Epoche=2375\n",
      "Epsilon=0.679969 Action_times=3904732 Epoche=2376\n",
      "Epsilon=0.679880 Action_times=3906065 Epoche=2377\n",
      "Epsilon=0.679808 Action_times=3907133 Epoche=2378\n",
      "Epsilon=0.679696 Action_times=3908816 Epoche=2379\n",
      "Epsilon=0.679675 Action_times=3909127 Epoche=2380\n",
      "Epsilon=0.679559 Action_times=3910852 Epoche=2381\n",
      "Epsilon=0.679457 Action_times=3912385 Epoche=2382\n",
      "Epsilon=0.679425 Action_times=3912853 Epoche=2383\n",
      "Epsilon=0.679275 Action_times=3915096 Epoche=2384\n",
      "Epsilon=0.679151 Action_times=3916949 Epoche=2385\n",
      "Epsilon=0.679097 Action_times=3917754 Epoche=2386\n",
      "Epsilon=0.679049 Action_times=3918469 Epoche=2387\n",
      "Epsilon=0.679012 Action_times=3919036 Epoche=2388\n",
      "Epsilon=0.678941 Action_times=3920090 Epoche=2389\n",
      "Epsilon=0.678866 Action_times=3921215 Epoche=2390\n",
      "Epsilon=0.678835 Action_times=3921669 Epoche=2391\n",
      "Epsilon=0.678741 Action_times=3923084 Epoche=2392\n",
      "Epsilon=0.678644 Action_times=3924533 Epoche=2393\n",
      "Epsilon=0.678549 Action_times=3925948 Epoche=2394\n",
      "Epsilon=0.678446 Action_times=3927489 Epoche=2395\n",
      "Epsilon=0.678425 Action_times=3927814 Epoche=2396\n",
      "Epsilon=0.678362 Action_times=3928748 Epoche=2397\n",
      "Epsilon=0.678321 Action_times=3929361 Epoche=2398\n",
      "Epsilon=0.678265 Action_times=3930195 Epoche=2399\n",
      "Epsilon=0.678136 Action_times=3932126 Epoche=2400\n",
      "Epsilon=0.677957 Action_times=3934813 Epoche=2401\n",
      "Epsilon=0.677778 Action_times=3937488 Epoche=2402\n",
      "Epsilon=0.677674 Action_times=3939052 Epoche=2403\n",
      "Epsilon=0.677584 Action_times=3940396 Epoche=2404\n",
      "Epsilon=0.677542 Action_times=3941028 Epoche=2405\n",
      "Epsilon=0.677505 Action_times=3941579 Epoche=2406\n",
      "Epsilon=0.677407 Action_times=3943056 Epoche=2407\n",
      "Epsilon=0.677382 Action_times=3943420 Epoche=2408\n",
      "Epsilon=0.677336 Action_times=3944111 Epoche=2409\n",
      "Epsilon=0.677299 Action_times=3944667 Epoche=2410\n",
      "Epsilon=0.677200 Action_times=3946146 Epoche=2411\n",
      "Epsilon=0.677173 Action_times=3946560 Epoche=2412\n",
      "Epsilon=0.677135 Action_times=3947119 Epoche=2413\n",
      "Epsilon=0.677064 Action_times=3948196 Epoche=2414\n",
      "Epsilon=0.677024 Action_times=3948782 Epoche=2415\n",
      "Epsilon=0.676979 Action_times=3949458 Epoche=2416\n",
      "Epsilon=0.676854 Action_times=3951336 Epoche=2417\n",
      "Epsilon=0.676846 Action_times=3951454 Epoche=2418\n",
      "Epsilon=0.676758 Action_times=3952777 Epoche=2419\n",
      "Epsilon=0.676594 Action_times=3955242 Epoche=2420\n",
      "Epsilon=0.676580 Action_times=3955445 Epoche=2421\n",
      "Epsilon=0.676572 Action_times=3955571 Epoche=2422\n",
      "Epsilon=0.676548 Action_times=3955933 Epoche=2423\n",
      "Epsilon=0.676448 Action_times=3957422 Epoche=2424\n",
      "Epsilon=0.676365 Action_times=3958672 Epoche=2425\n",
      "Epsilon=0.676286 Action_times=3959855 Epoche=2426\n",
      "Epsilon=0.676248 Action_times=3960435 Epoche=2427\n",
      "Epsilon=0.676204 Action_times=3961090 Epoche=2428\n",
      "Epsilon=0.676134 Action_times=3962135 Epoche=2429\n",
      "Epsilon=0.676071 Action_times=3963087 Epoche=2430\n",
      "Epsilon=0.675932 Action_times=3965175 Epoche=2431\n",
      "Epsilon=0.675839 Action_times=3966576 Epoche=2432\n",
      "Epsilon=0.675780 Action_times=3967463 Epoche=2433\n",
      "Epsilon=0.675703 Action_times=3968611 Epoche=2434\n",
      "Epsilon=0.675677 Action_times=3969009 Epoche=2435\n",
      "Epsilon=0.675531 Action_times=3971193 Epoche=2436\n",
      "Epsilon=0.675513 Action_times=3971470 Epoche=2437\n",
      "Epsilon=0.675462 Action_times=3972240 Epoche=2438\n",
      "Epsilon=0.675441 Action_times=3972556 Epoche=2439\n",
      "Epsilon=0.675409 Action_times=3973028 Epoche=2440\n",
      "Epsilon=0.675371 Action_times=3973595 Epoche=2441\n",
      "Epsilon=0.675276 Action_times=3975025 Epoche=2442\n",
      "Epsilon=0.675160 Action_times=3976780 Epoche=2443\n",
      "Epsilon=0.675122 Action_times=3977341 Epoche=2444\n",
      "Epsilon=0.675047 Action_times=3978479 Epoche=2445\n",
      "Epsilon=0.674998 Action_times=3979205 Epoche=2446\n",
      "Epsilon=0.674936 Action_times=3980146 Epoche=2447\n",
      "Epsilon=0.674877 Action_times=3981036 Epoche=2448\n",
      "Epsilon=0.674845 Action_times=3981508 Epoche=2449\n",
      "Epsilon=0.674797 Action_times=3982237 Epoche=2450\n",
      "Epsilon=0.674776 Action_times=3982548 Epoche=2451\n",
      "Epsilon=0.674702 Action_times=3983655 Epoche=2452\n",
      "Epsilon=0.674665 Action_times=3984217 Epoche=2453\n",
      "Epsilon=0.674651 Action_times=3984422 Epoche=2454\n",
      "Epsilon=0.674534 Action_times=3986186 Epoche=2455\n",
      "Epsilon=0.674496 Action_times=3986763 Epoche=2456\n",
      "Epsilon=0.674488 Action_times=3986888 Epoche=2457\n",
      "Epsilon=0.674439 Action_times=3987616 Epoche=2458\n",
      "Epsilon=0.674362 Action_times=3988781 Epoche=2459\n",
      "Epsilon=0.674310 Action_times=3989557 Epoche=2460\n",
      "Epsilon=0.674192 Action_times=3991336 Epoche=2461\n",
      "Epsilon=0.674154 Action_times=3991916 Epoche=2462\n",
      "Epsilon=0.674099 Action_times=3992741 Epoche=2463\n",
      "Epsilon=0.674019 Action_times=3993941 Epoche=2464\n",
      "Epsilon=0.673981 Action_times=3994518 Epoche=2465\n",
      "Epsilon=0.673907 Action_times=3995628 Epoche=2466\n",
      "Epsilon=0.673865 Action_times=3996268 Epoche=2467\n",
      "Epsilon=0.673838 Action_times=3996673 Epoche=2468\n",
      "Epsilon=0.673801 Action_times=3997222 Epoche=2469\n",
      "Epsilon=0.673749 Action_times=3998016 Epoche=2470\n",
      "Epsilon=0.673661 Action_times=3999338 Epoche=2471\n",
      "Epsilon=0.673504 Action_times=4001703 Epoche=2472\n",
      "Epsilon=0.673485 Action_times=4001990 Epoche=2473\n",
      "Epsilon=0.673389 Action_times=4003430 Epoche=2474\n",
      "Epsilon=0.673325 Action_times=4004403 Epoche=2475\n",
      "Epsilon=0.673288 Action_times=4004963 Epoche=2476\n",
      "Epsilon=0.673265 Action_times=4005300 Epoche=2477\n",
      "Epsilon=0.673209 Action_times=4006154 Epoche=2478\n",
      "Epsilon=0.673124 Action_times=4007423 Epoche=2479\n",
      "Epsilon=0.673068 Action_times=4008267 Epoche=2480\n",
      "Epsilon=0.673003 Action_times=4009249 Epoche=2481\n",
      "Epsilon=0.672961 Action_times=4009889 Epoche=2482\n",
      "Epsilon=0.672922 Action_times=4010469 Epoche=2483\n",
      "Epsilon=0.672855 Action_times=4011484 Epoche=2484\n",
      "Epsilon=0.672784 Action_times=4012558 Epoche=2485\n",
      "Epsilon=0.672728 Action_times=4013403 Epoche=2486\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.672616 Action_times=4015087 Epoche=2487\n",
      "Epsilon=0.672585 Action_times=4015563 Epoche=2488\n",
      "Epsilon=0.672419 Action_times=4018072 Epoche=2489\n",
      "Epsilon=0.672385 Action_times=4018573 Epoche=2490\n",
      "Epsilon=0.672296 Action_times=4019920 Epoche=2491\n",
      "Epsilon=0.672162 Action_times=4021942 Epoche=2492\n",
      "Epsilon=0.672123 Action_times=4022531 Epoche=2493\n",
      "Epsilon=0.672046 Action_times=4023703 Epoche=2494\n",
      "Epsilon=0.671993 Action_times=4024498 Epoche=2495\n",
      "Epsilon=0.671902 Action_times=4025880 Epoche=2496\n",
      "Epsilon=0.671807 Action_times=4027306 Epoche=2497\n",
      "Epsilon=0.671693 Action_times=4029033 Epoche=2498\n",
      "Epsilon=0.671638 Action_times=4029868 Epoche=2499\n",
      "Epsilon=0.671518 Action_times=4031678 Epoche=2500\n",
      "Epsilon=0.671450 Action_times=4032701 Epoche=2501\n",
      "Epsilon=0.671397 Action_times=4033510 Epoche=2502\n",
      "Epsilon=0.671258 Action_times=4035614 Epoche=2503\n",
      "Epsilon=0.671170 Action_times=4036935 Epoche=2504\n",
      "Epsilon=0.671012 Action_times=4039334 Epoche=2505\n",
      "Epsilon=0.670910 Action_times=4040867 Epoche=2506\n",
      "Epsilon=0.670702 Action_times=4044026 Epoche=2507\n",
      "Epsilon=0.670628 Action_times=4045135 Epoche=2508\n",
      "Epsilon=0.670523 Action_times=4046724 Epoche=2509\n",
      "Epsilon=0.670510 Action_times=4046933 Epoche=2510\n",
      "Epsilon=0.670456 Action_times=4047740 Epoche=2511\n",
      "Epsilon=0.670344 Action_times=4049433 Epoche=2512\n",
      "Epsilon=0.670278 Action_times=4050444 Epoche=2513\n",
      "Epsilon=0.670102 Action_times=4053109 Epoche=2514\n",
      "Epsilon=0.670034 Action_times=4054136 Epoche=2515\n",
      "Epsilon=0.670031 Action_times=4054179 Epoche=2516\n",
      "Epsilon=0.669944 Action_times=4055502 Epoche=2517\n",
      "Epsilon=0.669854 Action_times=4056861 Epoche=2518\n",
      "Epsilon=0.669801 Action_times=4057667 Epoche=2519\n",
      "Epsilon=0.669737 Action_times=4058633 Epoche=2520\n",
      "Epsilon=0.669702 Action_times=4059165 Epoche=2521\n",
      "Epsilon=0.669581 Action_times=4060997 Epoche=2522\n",
      "Epsilon=0.669528 Action_times=4061801 Epoche=2523\n",
      "Epsilon=0.669454 Action_times=4062934 Epoche=2524\n",
      "Epsilon=0.669412 Action_times=4063567 Epoche=2525\n",
      "Epsilon=0.669334 Action_times=4064752 Epoche=2526\n",
      "Epsilon=0.669280 Action_times=4065565 Epoche=2527\n",
      "Epsilon=0.669206 Action_times=4066691 Epoche=2528\n",
      "Epsilon=0.669130 Action_times=4067842 Epoche=2529\n",
      "Epsilon=0.669035 Action_times=4069285 Epoche=2530\n",
      "Epsilon=0.669008 Action_times=4069690 Epoche=2531\n",
      "Epsilon=0.668926 Action_times=4070932 Epoche=2532\n",
      "Epsilon=0.668843 Action_times=4072198 Epoche=2533\n",
      "Epsilon=0.668770 Action_times=4073311 Epoche=2534\n",
      "Epsilon=0.668663 Action_times=4074932 Epoche=2535\n",
      "Epsilon=0.668518 Action_times=4077134 Epoche=2536\n",
      "Epsilon=0.668484 Action_times=4077653 Epoche=2537\n",
      "Epsilon=0.668407 Action_times=4078824 Epoche=2538\n",
      "Epsilon=0.668362 Action_times=4079495 Epoche=2539\n",
      "Epsilon=0.668323 Action_times=4080090 Epoche=2540\n",
      "Epsilon=0.668249 Action_times=4081224 Epoche=2541\n",
      "Epsilon=0.668187 Action_times=4082166 Epoche=2542\n",
      "Epsilon=0.668149 Action_times=4082741 Epoche=2543\n",
      "Epsilon=0.668131 Action_times=4083002 Epoche=2544\n",
      "Epsilon=0.668067 Action_times=4083987 Epoche=2545\n",
      "Epsilon=0.667973 Action_times=4085416 Epoche=2546\n",
      "Epsilon=0.667956 Action_times=4085674 Epoche=2547\n",
      "Epsilon=0.667879 Action_times=4086834 Epoche=2548\n",
      "Epsilon=0.667760 Action_times=4088650 Epoche=2549\n",
      "Epsilon=0.667683 Action_times=4089818 Epoche=2550\n",
      "Epsilon=0.667661 Action_times=4090151 Epoche=2551\n",
      "Epsilon=0.667618 Action_times=4090803 Epoche=2552\n",
      "Epsilon=0.667575 Action_times=4091465 Epoche=2553\n",
      "Epsilon=0.667505 Action_times=4092532 Epoche=2554\n",
      "Epsilon=0.667439 Action_times=4093528 Epoche=2555\n",
      "Epsilon=0.667433 Action_times=4093622 Epoche=2556\n",
      "Epsilon=0.667378 Action_times=4094455 Epoche=2557\n",
      "Epsilon=0.667357 Action_times=4094782 Epoche=2558\n",
      "Epsilon=0.667266 Action_times=4096157 Epoche=2559\n",
      "Epsilon=0.667246 Action_times=4096469 Epoche=2560\n",
      "Epsilon=0.667177 Action_times=4097516 Epoche=2561\n",
      "Epsilon=0.667013 Action_times=4100006 Epoche=2562\n",
      "Epsilon=0.666920 Action_times=4101431 Epoche=2563\n",
      "Epsilon=0.666866 Action_times=4102246 Epoche=2564\n",
      "Epsilon=0.666832 Action_times=4102762 Epoche=2565\n",
      "Epsilon=0.666742 Action_times=4104142 Epoche=2566\n",
      "Epsilon=0.666736 Action_times=4104225 Epoche=2567\n",
      "Epsilon=0.666684 Action_times=4105022 Epoche=2568\n",
      "Epsilon=0.666599 Action_times=4106321 Epoche=2569\n",
      "Epsilon=0.666517 Action_times=4107561 Epoche=2570\n",
      "Epsilon=0.666465 Action_times=4108358 Epoche=2571\n",
      "Epsilon=0.666423 Action_times=4108998 Epoche=2572\n",
      "Epsilon=0.666347 Action_times=4110146 Epoche=2573\n",
      "Epsilon=0.666244 Action_times=4111724 Epoche=2574\n",
      "Epsilon=0.666220 Action_times=4112093 Epoche=2575\n",
      "Epsilon=0.666173 Action_times=4112799 Epoche=2576\n",
      "Epsilon=0.666048 Action_times=4114717 Epoche=2577\n",
      "Epsilon=0.665947 Action_times=4116252 Epoche=2578\n",
      "Epsilon=0.665907 Action_times=4116856 Epoche=2579\n",
      "Epsilon=0.665858 Action_times=4117605 Epoche=2580\n",
      "Epsilon=0.665801 Action_times=4118474 Epoche=2581\n",
      "Epsilon=0.665762 Action_times=4119077 Epoche=2582\n",
      "Epsilon=0.665756 Action_times=4119164 Epoche=2583\n",
      "Epsilon=0.665702 Action_times=4119986 Epoche=2584\n",
      "Epsilon=0.665600 Action_times=4121540 Epoche=2585\n",
      "Epsilon=0.665528 Action_times=4122636 Epoche=2586\n",
      "Epsilon=0.665443 Action_times=4123942 Epoche=2587\n",
      "Epsilon=0.665247 Action_times=4126925 Epoche=2588\n",
      "Epsilon=0.665152 Action_times=4128370 Epoche=2589\n",
      "Epsilon=0.665078 Action_times=4129501 Epoche=2590\n",
      "Epsilon=0.665034 Action_times=4130179 Epoche=2591\n",
      "Epsilon=0.664986 Action_times=4130913 Epoche=2592\n",
      "Epsilon=0.664932 Action_times=4131728 Epoche=2593\n",
      "Epsilon=0.664811 Action_times=4133584 Epoche=2594\n",
      "Epsilon=0.664790 Action_times=4133899 Epoche=2595\n",
      "Epsilon=0.664765 Action_times=4134282 Epoche=2596\n",
      "Epsilon=0.664683 Action_times=4135532 Epoche=2597\n",
      "Epsilon=0.664651 Action_times=4136028 Epoche=2598\n",
      "Epsilon=0.664574 Action_times=4137206 Epoche=2599\n",
      "Epsilon=0.664518 Action_times=4138051 Epoche=2600\n",
      "Epsilon=0.664493 Action_times=4138435 Epoche=2601\n",
      "Epsilon=0.664410 Action_times=4139709 Epoche=2602\n",
      "Epsilon=0.664362 Action_times=4140438 Epoche=2603\n",
      "Epsilon=0.664324 Action_times=4141019 Epoche=2604\n",
      "Epsilon=0.664314 Action_times=4141179 Epoche=2605\n",
      "Epsilon=0.664231 Action_times=4142452 Epoche=2606\n",
      "Epsilon=0.664050 Action_times=4145214 Epoche=2607\n",
      "Epsilon=0.664047 Action_times=4145252 Epoche=2608\n",
      "Epsilon=0.663922 Action_times=4147172 Epoche=2609\n",
      "Epsilon=0.663848 Action_times=4148297 Epoche=2610\n",
      "Epsilon=0.663741 Action_times=4149940 Epoche=2611\n",
      "Epsilon=0.663646 Action_times=4151383 Epoche=2612\n",
      "Epsilon=0.663568 Action_times=4152587 Epoche=2613\n",
      "Epsilon=0.663505 Action_times=4153553 Epoche=2614\n",
      "Epsilon=0.663441 Action_times=4154523 Epoche=2615\n",
      "Epsilon=0.663440 Action_times=4154544 Epoche=2616\n",
      "Epsilon=0.663334 Action_times=4156165 Epoche=2617\n",
      "Epsilon=0.663248 Action_times=4157480 Epoche=2618\n",
      "Epsilon=0.663128 Action_times=4159317 Epoche=2619\n",
      "Epsilon=0.663061 Action_times=4160346 Epoche=2620\n",
      "Epsilon=0.663016 Action_times=4161033 Epoche=2621\n",
      "Epsilon=0.662935 Action_times=4162273 Epoche=2622\n",
      "Epsilon=0.662868 Action_times=4163303 Epoche=2623\n",
      "Epsilon=0.662758 Action_times=4164979 Epoche=2624\n",
      "Epsilon=0.662678 Action_times=4166213 Epoche=2625\n",
      "Epsilon=0.662674 Action_times=4166275 Epoche=2626\n",
      "Epsilon=0.662610 Action_times=4167250 Epoche=2627\n",
      "Epsilon=0.662553 Action_times=4168127 Epoche=2628\n",
      "Epsilon=0.662468 Action_times=4169433 Epoche=2629\n",
      "Epsilon=0.662455 Action_times=4169633 Epoche=2630\n",
      "Epsilon=0.662425 Action_times=4170094 Epoche=2631\n",
      "Epsilon=0.662345 Action_times=4171318 Epoche=2632\n",
      "Epsilon=0.662306 Action_times=4171904 Epoche=2633\n",
      "Epsilon=0.662273 Action_times=4172411 Epoche=2634\n",
      "Epsilon=0.662246 Action_times=4172827 Epoche=2635\n",
      "Epsilon=0.662180 Action_times=4173844 Epoche=2636\n",
      "Epsilon=0.662122 Action_times=4174728 Epoche=2637\n",
      "Epsilon=0.662040 Action_times=4175989 Epoche=2638\n",
      "Epsilon=0.661996 Action_times=4176672 Epoche=2639\n",
      "Epsilon=0.661990 Action_times=4176751 Epoche=2640\n",
      "Epsilon=0.661863 Action_times=4178712 Epoche=2641\n",
      "Epsilon=0.661780 Action_times=4179972 Epoche=2642\n",
      "Epsilon=0.661729 Action_times=4180766 Epoche=2643\n",
      "Epsilon=0.661613 Action_times=4182540 Epoche=2644\n",
      "Epsilon=0.661561 Action_times=4183339 Epoche=2645\n",
      "Epsilon=0.661479 Action_times=4184601 Epoche=2646\n",
      "Epsilon=0.661450 Action_times=4185036 Epoche=2647\n",
      "Epsilon=0.661389 Action_times=4185986 Epoche=2648\n",
      "Epsilon=0.661307 Action_times=4187232 Epoche=2649\n",
      "Epsilon=0.661240 Action_times=4188262 Epoche=2650\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.661171 Action_times=4189322 Epoche=2651\n",
      "Epsilon=0.661123 Action_times=4190063 Epoche=2652\n",
      "Epsilon=0.660957 Action_times=4192614 Epoche=2653\n",
      "Epsilon=0.660891 Action_times=4193635 Epoche=2654\n",
      "Epsilon=0.660734 Action_times=4196042 Epoche=2655\n",
      "Epsilon=0.660661 Action_times=4197168 Epoche=2656\n",
      "Epsilon=0.660522 Action_times=4199304 Epoche=2657\n",
      "Epsilon=0.660384 Action_times=4201427 Epoche=2658\n",
      "Epsilon=0.660271 Action_times=4203160 Epoche=2659\n",
      "Epsilon=0.660174 Action_times=4204655 Epoche=2660\n",
      "Epsilon=0.659919 Action_times=4208567 Epoche=2661\n",
      "Epsilon=0.659807 Action_times=4210296 Epoche=2662\n",
      "Epsilon=0.659766 Action_times=4210927 Epoche=2663\n",
      "Epsilon=0.659745 Action_times=4211242 Epoche=2664\n",
      "Epsilon=0.659613 Action_times=4213285 Epoche=2665\n",
      "Epsilon=0.659526 Action_times=4214626 Epoche=2666\n",
      "Epsilon=0.659463 Action_times=4215585 Epoche=2667\n",
      "Epsilon=0.659370 Action_times=4217030 Epoche=2668\n",
      "Epsilon=0.659355 Action_times=4217251 Epoche=2669\n",
      "Epsilon=0.659315 Action_times=4217875 Epoche=2670\n",
      "Epsilon=0.659283 Action_times=4218369 Epoche=2671\n",
      "Epsilon=0.659256 Action_times=4218781 Epoche=2672\n",
      "Epsilon=0.659217 Action_times=4219383 Epoche=2673\n",
      "Epsilon=0.659147 Action_times=4220459 Epoche=2674\n",
      "Epsilon=0.659046 Action_times=4222020 Epoche=2675\n",
      "Epsilon=0.658940 Action_times=4223642 Epoche=2676\n",
      "Epsilon=0.658833 Action_times=4225302 Epoche=2677\n",
      "Epsilon=0.658777 Action_times=4226152 Epoche=2678\n",
      "Epsilon=0.658696 Action_times=4227411 Epoche=2679\n",
      "Epsilon=0.658621 Action_times=4228571 Epoche=2680\n",
      "Epsilon=0.658611 Action_times=4228711 Epoche=2681\n",
      "Epsilon=0.658578 Action_times=4229230 Epoche=2682\n",
      "Epsilon=0.658533 Action_times=4229922 Epoche=2683\n",
      "Epsilon=0.658515 Action_times=4230199 Epoche=2684\n",
      "Epsilon=0.658510 Action_times=4230276 Epoche=2685\n",
      "Epsilon=0.658495 Action_times=4230503 Epoche=2686\n",
      "Epsilon=0.658462 Action_times=4231022 Epoche=2687\n",
      "Epsilon=0.658414 Action_times=4231762 Epoche=2688\n",
      "Epsilon=0.658334 Action_times=4232983 Epoche=2689\n",
      "Epsilon=0.658296 Action_times=4233578 Epoche=2690\n",
      "Epsilon=0.658254 Action_times=4234223 Epoche=2691\n",
      "Epsilon=0.658217 Action_times=4234788 Epoche=2692\n",
      "Epsilon=0.658123 Action_times=4236245 Epoche=2693\n",
      "Epsilon=0.657997 Action_times=4238193 Epoche=2694\n",
      "Epsilon=0.657931 Action_times=4239206 Epoche=2695\n",
      "Epsilon=0.657894 Action_times=4239781 Epoche=2696\n",
      "Epsilon=0.657844 Action_times=4240550 Epoche=2697\n",
      "Epsilon=0.657797 Action_times=4241271 Epoche=2698\n",
      "Epsilon=0.657737 Action_times=4242200 Epoche=2699\n",
      "Epsilon=0.657643 Action_times=4243647 Epoche=2700\n",
      "Epsilon=0.657603 Action_times=4244264 Epoche=2701\n",
      "Epsilon=0.657567 Action_times=4244822 Epoche=2702\n",
      "Epsilon=0.657527 Action_times=4245445 Epoche=2703\n",
      "Epsilon=0.657436 Action_times=4246856 Epoche=2704\n",
      "Epsilon=0.657294 Action_times=4249045 Epoche=2705\n",
      "Epsilon=0.657224 Action_times=4250125 Epoche=2706\n",
      "Epsilon=0.657128 Action_times=4251601 Epoche=2707\n",
      "Epsilon=0.657099 Action_times=4252051 Epoche=2708\n",
      "Epsilon=0.657064 Action_times=4252599 Epoche=2709\n",
      "Epsilon=0.657022 Action_times=4253245 Epoche=2710\n",
      "Epsilon=0.656967 Action_times=4254104 Epoche=2711\n",
      "Epsilon=0.656898 Action_times=4255169 Epoche=2712\n",
      "Epsilon=0.656888 Action_times=4255318 Epoche=2713\n",
      "Epsilon=0.656841 Action_times=4256045 Epoche=2714\n",
      "Epsilon=0.656785 Action_times=4256917 Epoche=2715\n",
      "Epsilon=0.656698 Action_times=4258254 Epoche=2716\n",
      "Epsilon=0.656638 Action_times=4259177 Epoche=2717\n",
      "Epsilon=0.656592 Action_times=4259902 Epoche=2718\n",
      "Epsilon=0.656553 Action_times=4260504 Epoche=2719\n",
      "Epsilon=0.656458 Action_times=4261974 Epoche=2720\n",
      "Epsilon=0.656453 Action_times=4262040 Epoche=2721\n",
      "Epsilon=0.656435 Action_times=4262321 Epoche=2722\n",
      "Epsilon=0.656403 Action_times=4262812 Epoche=2723\n",
      "Epsilon=0.656334 Action_times=4263882 Epoche=2724\n",
      "Epsilon=0.656303 Action_times=4264361 Epoche=2725\n",
      "Epsilon=0.656260 Action_times=4265025 Epoche=2726\n",
      "Epsilon=0.656176 Action_times=4266324 Epoche=2727\n",
      "Epsilon=0.656083 Action_times=4267777 Epoche=2728\n",
      "Epsilon=0.656060 Action_times=4268128 Epoche=2729\n",
      "Epsilon=0.655992 Action_times=4269183 Epoche=2730\n",
      "Epsilon=0.655913 Action_times=4270407 Epoche=2731\n",
      "Epsilon=0.655868 Action_times=4271091 Epoche=2732\n",
      "Epsilon=0.655837 Action_times=4271574 Epoche=2733\n",
      "Epsilon=0.655827 Action_times=4271732 Epoche=2734\n",
      "Epsilon=0.655815 Action_times=4271917 Epoche=2735\n",
      "Epsilon=0.655779 Action_times=4272478 Epoche=2736\n",
      "Epsilon=0.655699 Action_times=4273711 Epoche=2737\n",
      "Epsilon=0.655622 Action_times=4274905 Epoche=2738\n",
      "Epsilon=0.655597 Action_times=4275302 Epoche=2739\n",
      "Epsilon=0.655517 Action_times=4276539 Epoche=2740\n",
      "Epsilon=0.655476 Action_times=4277164 Epoche=2741\n",
      "Epsilon=0.655407 Action_times=4278240 Epoche=2742\n",
      "Epsilon=0.655318 Action_times=4279623 Epoche=2743\n",
      "Epsilon=0.655250 Action_times=4280675 Epoche=2744\n",
      "Epsilon=0.655216 Action_times=4281205 Epoche=2745\n",
      "Epsilon=0.655137 Action_times=4282429 Epoche=2746\n",
      "Epsilon=0.655095 Action_times=4283072 Epoche=2747\n",
      "Epsilon=0.655058 Action_times=4283641 Epoche=2748\n",
      "Epsilon=0.655019 Action_times=4284250 Epoche=2749\n",
      "Epsilon=0.654971 Action_times=4284992 Epoche=2750\n",
      "Epsilon=0.654936 Action_times=4285544 Epoche=2751\n",
      "Epsilon=0.654906 Action_times=4286010 Epoche=2752\n",
      "Epsilon=0.654788 Action_times=4287841 Epoche=2753\n",
      "Epsilon=0.654751 Action_times=4288408 Epoche=2754\n",
      "Epsilon=0.654655 Action_times=4289899 Epoche=2755\n",
      "Epsilon=0.654508 Action_times=4292173 Epoche=2756\n",
      "Epsilon=0.654460 Action_times=4292926 Epoche=2757\n",
      "Epsilon=0.654403 Action_times=4293803 Epoche=2758\n",
      "Epsilon=0.654337 Action_times=4294828 Epoche=2759\n",
      "Epsilon=0.654297 Action_times=4295456 Epoche=2760\n",
      "Epsilon=0.654279 Action_times=4295738 Epoche=2761\n",
      "Epsilon=0.654190 Action_times=4297120 Epoche=2762\n",
      "Epsilon=0.654125 Action_times=4298114 Epoche=2763\n",
      "Epsilon=0.654117 Action_times=4298248 Epoche=2764\n",
      "Epsilon=0.654061 Action_times=4299112 Epoche=2765\n",
      "Epsilon=0.653963 Action_times=4300633 Epoche=2766\n",
      "Epsilon=0.653914 Action_times=4301402 Epoche=2767\n",
      "Epsilon=0.653911 Action_times=4301448 Epoche=2768\n",
      "Epsilon=0.653828 Action_times=4302734 Epoche=2769\n",
      "Epsilon=0.653794 Action_times=4303256 Epoche=2770\n",
      "Epsilon=0.653647 Action_times=4305546 Epoche=2771\n",
      "Epsilon=0.653569 Action_times=4306761 Epoche=2772\n",
      "Epsilon=0.653457 Action_times=4308504 Epoche=2773\n",
      "Epsilon=0.653373 Action_times=4309800 Epoche=2774\n",
      "Epsilon=0.653218 Action_times=4312212 Epoche=2775\n",
      "Epsilon=0.653147 Action_times=4313319 Epoche=2776\n",
      "Epsilon=0.653046 Action_times=4314889 Epoche=2777\n",
      "Epsilon=0.652957 Action_times=4316267 Epoche=2778\n",
      "Epsilon=0.652911 Action_times=4316983 Epoche=2779\n",
      "Epsilon=0.652837 Action_times=4318135 Epoche=2780\n",
      "Epsilon=0.652804 Action_times=4318658 Epoche=2781\n",
      "Epsilon=0.652795 Action_times=4318784 Epoche=2782\n",
      "Epsilon=0.652730 Action_times=4319796 Epoche=2783\n",
      "Epsilon=0.652715 Action_times=4320028 Epoche=2784\n",
      "Epsilon=0.652622 Action_times=4321486 Epoche=2785\n",
      "Epsilon=0.652512 Action_times=4323191 Epoche=2786\n",
      "Epsilon=0.652403 Action_times=4324897 Epoche=2787\n",
      "Epsilon=0.652314 Action_times=4326282 Epoche=2788\n",
      "Epsilon=0.652280 Action_times=4326804 Epoche=2789\n",
      "Epsilon=0.652150 Action_times=4328835 Epoche=2790\n",
      "Epsilon=0.652104 Action_times=4329541 Epoche=2791\n",
      "Epsilon=0.652025 Action_times=4330772 Epoche=2792\n",
      "Epsilon=0.652002 Action_times=4331139 Epoche=2793\n",
      "Epsilon=0.651941 Action_times=4332081 Epoche=2794\n",
      "Epsilon=0.651924 Action_times=4332348 Epoche=2795\n",
      "Epsilon=0.651867 Action_times=4333246 Epoche=2796\n",
      "Epsilon=0.651845 Action_times=4333582 Epoche=2797\n",
      "Epsilon=0.651794 Action_times=4334379 Epoche=2798\n",
      "Epsilon=0.651764 Action_times=4334839 Epoche=2799\n",
      "Epsilon=0.651717 Action_times=4335579 Epoche=2800\n",
      "Epsilon=0.651662 Action_times=4336428 Epoche=2801\n",
      "Epsilon=0.651559 Action_times=4338042 Epoche=2802\n",
      "Epsilon=0.651496 Action_times=4339025 Epoche=2803\n",
      "Epsilon=0.651359 Action_times=4341153 Epoche=2804\n",
      "Epsilon=0.651176 Action_times=4344010 Epoche=2805\n",
      "Epsilon=0.651120 Action_times=4344880 Epoche=2806\n",
      "Epsilon=0.651091 Action_times=4345343 Epoche=2807\n",
      "Epsilon=0.651030 Action_times=4346288 Epoche=2808\n",
      "Epsilon=0.650959 Action_times=4347397 Epoche=2809\n",
      "Epsilon=0.650857 Action_times=4348990 Epoche=2810\n",
      "Epsilon=0.650771 Action_times=4350324 Epoche=2811\n",
      "Epsilon=0.650702 Action_times=4351409 Epoche=2812\n",
      "Epsilon=0.650666 Action_times=4351962 Epoche=2813\n",
      "Epsilon=0.650533 Action_times=4354042 Epoche=2814\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.650481 Action_times=4354850 Epoche=2815\n",
      "Epsilon=0.650381 Action_times=4356419 Epoche=2816\n",
      "Epsilon=0.650304 Action_times=4357617 Epoche=2817\n",
      "Epsilon=0.650247 Action_times=4358514 Epoche=2818\n",
      "Epsilon=0.650168 Action_times=4359743 Epoche=2819\n",
      "Epsilon=0.650156 Action_times=4359928 Epoche=2820\n",
      "Epsilon=0.650104 Action_times=4360737 Epoche=2821\n",
      "Epsilon=0.650078 Action_times=4361153 Epoche=2822\n",
      "Epsilon=0.650024 Action_times=4361997 Epoche=2823\n",
      "Epsilon=0.649975 Action_times=4362763 Epoche=2824\n",
      "Epsilon=0.649957 Action_times=4363040 Epoche=2825\n",
      "Epsilon=0.649891 Action_times=4364071 Epoche=2826\n",
      "Epsilon=0.649824 Action_times=4365111 Epoche=2827\n",
      "Epsilon=0.649782 Action_times=4365780 Epoche=2828\n",
      "Epsilon=0.649685 Action_times=4367287 Epoche=2829\n",
      "Epsilon=0.649653 Action_times=4367793 Epoche=2830\n",
      "Epsilon=0.649624 Action_times=4368247 Epoche=2831\n",
      "Epsilon=0.649572 Action_times=4369062 Epoche=2832\n",
      "Epsilon=0.649533 Action_times=4369663 Epoche=2833\n",
      "Epsilon=0.649455 Action_times=4370888 Epoche=2834\n",
      "Epsilon=0.649409 Action_times=4371613 Epoche=2835\n",
      "Epsilon=0.649352 Action_times=4372498 Epoche=2836\n",
      "Epsilon=0.649301 Action_times=4373300 Epoche=2837\n",
      "Epsilon=0.649247 Action_times=4374142 Epoche=2838\n",
      "Epsilon=0.649110 Action_times=4376283 Epoche=2839\n",
      "Epsilon=0.648975 Action_times=4378392 Epoche=2840\n",
      "Epsilon=0.648961 Action_times=4378622 Epoche=2841\n",
      "Epsilon=0.648930 Action_times=4379106 Epoche=2842\n",
      "Epsilon=0.648883 Action_times=4379839 Epoche=2843\n",
      "Epsilon=0.648863 Action_times=4380154 Epoche=2844\n",
      "Epsilon=0.648832 Action_times=4380636 Epoche=2845\n",
      "Epsilon=0.648797 Action_times=4381177 Epoche=2846\n",
      "Epsilon=0.648716 Action_times=4382456 Epoche=2847\n",
      "Epsilon=0.648683 Action_times=4382963 Epoche=2848\n",
      "Epsilon=0.648681 Action_times=4383006 Epoche=2849\n",
      "Epsilon=0.648581 Action_times=4384557 Epoche=2850\n",
      "Epsilon=0.648545 Action_times=4385124 Epoche=2851\n",
      "Epsilon=0.648524 Action_times=4385463 Epoche=2852\n",
      "Epsilon=0.648454 Action_times=4386550 Epoche=2853\n",
      "Epsilon=0.648150 Action_times=4391313 Epoche=2854\n",
      "Epsilon=0.648109 Action_times=4391955 Epoche=2855\n",
      "Epsilon=0.648062 Action_times=4392695 Epoche=2856\n",
      "Epsilon=0.648039 Action_times=4393055 Epoche=2857\n",
      "Epsilon=0.648029 Action_times=4393207 Epoche=2858\n",
      "Epsilon=0.648023 Action_times=4393300 Epoche=2859\n",
      "Epsilon=0.647990 Action_times=4393828 Epoche=2860\n",
      "Epsilon=0.647937 Action_times=4394656 Epoche=2861\n",
      "Epsilon=0.647913 Action_times=4395026 Epoche=2862\n",
      "Epsilon=0.647907 Action_times=4395124 Epoche=2863\n",
      "Epsilon=0.647845 Action_times=4396104 Epoche=2864\n",
      "Epsilon=0.647716 Action_times=4398119 Epoche=2865\n",
      "Epsilon=0.647661 Action_times=4398986 Epoche=2866\n",
      "Epsilon=0.647623 Action_times=4399583 Epoche=2867\n",
      "Epsilon=0.647511 Action_times=4401338 Epoche=2868\n",
      "Epsilon=0.647461 Action_times=4402123 Epoche=2869\n",
      "Epsilon=0.647386 Action_times=4403292 Epoche=2870\n",
      "Epsilon=0.647342 Action_times=4403993 Epoche=2871\n",
      "Epsilon=0.647281 Action_times=4404940 Epoche=2872\n",
      "Epsilon=0.647259 Action_times=4405285 Epoche=2873\n",
      "Epsilon=0.647186 Action_times=4406431 Epoche=2874\n",
      "Epsilon=0.647100 Action_times=4407777 Epoche=2875\n",
      "Epsilon=0.647027 Action_times=4408930 Epoche=2876\n",
      "Epsilon=0.646931 Action_times=4410443 Epoche=2877\n",
      "Epsilon=0.646822 Action_times=4412141 Epoche=2878\n",
      "Epsilon=0.646743 Action_times=4413396 Epoche=2879\n",
      "Epsilon=0.646611 Action_times=4415455 Epoche=2880\n",
      "Epsilon=0.646551 Action_times=4416407 Epoche=2881\n",
      "Epsilon=0.646462 Action_times=4417802 Epoche=2882\n",
      "Epsilon=0.646386 Action_times=4418989 Epoche=2883\n",
      "Epsilon=0.646343 Action_times=4419669 Epoche=2884\n",
      "Epsilon=0.646303 Action_times=4420299 Epoche=2885\n",
      "Epsilon=0.646173 Action_times=4422344 Epoche=2886\n",
      "Epsilon=0.646113 Action_times=4423293 Epoche=2887\n",
      "Epsilon=0.646024 Action_times=4424691 Epoche=2888\n",
      "Epsilon=0.645969 Action_times=4425557 Epoche=2889\n",
      "Epsilon=0.645847 Action_times=4427471 Epoche=2890\n",
      "Epsilon=0.645815 Action_times=4427966 Epoche=2891\n",
      "Epsilon=0.645770 Action_times=4428680 Epoche=2892\n",
      "Epsilon=0.645758 Action_times=4428869 Epoche=2893\n",
      "Epsilon=0.645729 Action_times=4429318 Epoche=2894\n",
      "Epsilon=0.645692 Action_times=4429903 Epoche=2895\n",
      "Epsilon=0.645659 Action_times=4430434 Epoche=2896\n",
      "Epsilon=0.645601 Action_times=4431334 Epoche=2897\n",
      "Epsilon=0.645583 Action_times=4431623 Epoche=2898\n",
      "Epsilon=0.645461 Action_times=4433544 Epoche=2899\n",
      "Epsilon=0.645332 Action_times=4435567 Epoche=2900\n",
      "Epsilon=0.645219 Action_times=4437351 Epoche=2901\n",
      "Epsilon=0.645189 Action_times=4437822 Epoche=2902\n",
      "Epsilon=0.645152 Action_times=4438410 Epoche=2903\n",
      "Epsilon=0.645102 Action_times=4439199 Epoche=2904\n",
      "Epsilon=0.645090 Action_times=4439375 Epoche=2905\n",
      "Epsilon=0.644903 Action_times=4442326 Epoche=2906\n",
      "Epsilon=0.644766 Action_times=4444488 Epoche=2907\n",
      "Epsilon=0.644753 Action_times=4444692 Epoche=2908\n",
      "Epsilon=0.644633 Action_times=4446580 Epoche=2909\n",
      "Epsilon=0.644543 Action_times=4447996 Epoche=2910\n",
      "Epsilon=0.644459 Action_times=4449324 Epoche=2911\n",
      "Epsilon=0.644345 Action_times=4451126 Epoche=2912\n",
      "Epsilon=0.644332 Action_times=4451331 Epoche=2913\n",
      "Epsilon=0.644203 Action_times=4453353 Epoche=2914\n",
      "Epsilon=0.644147 Action_times=4454249 Epoche=2915\n",
      "Epsilon=0.644069 Action_times=4455477 Epoche=2916\n",
      "Epsilon=0.643962 Action_times=4457163 Epoche=2917\n",
      "Epsilon=0.643942 Action_times=4457479 Epoche=2918\n",
      "Epsilon=0.643903 Action_times=4458087 Epoche=2919\n",
      "Epsilon=0.643834 Action_times=4459175 Epoche=2920\n",
      "Epsilon=0.643706 Action_times=4461198 Epoche=2921\n",
      "Epsilon=0.643650 Action_times=4462085 Epoche=2922\n",
      "Epsilon=0.643537 Action_times=4463870 Epoche=2923\n",
      "Epsilon=0.643502 Action_times=4464410 Epoche=2924\n",
      "Epsilon=0.643452 Action_times=4465211 Epoche=2925\n",
      "Epsilon=0.643351 Action_times=4466799 Epoche=2926\n",
      "Epsilon=0.643339 Action_times=4466986 Epoche=2927\n",
      "Epsilon=0.643274 Action_times=4468021 Epoche=2928\n",
      "Epsilon=0.643231 Action_times=4468697 Epoche=2929\n",
      "Epsilon=0.643194 Action_times=4469284 Epoche=2930\n",
      "Epsilon=0.643093 Action_times=4470880 Epoche=2931\n",
      "Epsilon=0.643068 Action_times=4471277 Epoche=2932\n",
      "Epsilon=0.642928 Action_times=4473489 Epoche=2933\n",
      "Epsilon=0.642782 Action_times=4475785 Epoche=2934\n",
      "Epsilon=0.642683 Action_times=4477348 Epoche=2935\n",
      "Epsilon=0.642625 Action_times=4478273 Epoche=2936\n",
      "Epsilon=0.642600 Action_times=4478666 Epoche=2937\n",
      "Epsilon=0.642539 Action_times=4479625 Epoche=2938\n",
      "Epsilon=0.642468 Action_times=4480760 Epoche=2939\n",
      "Epsilon=0.642446 Action_times=4481104 Epoche=2940\n",
      "Epsilon=0.642401 Action_times=4481816 Epoche=2941\n",
      "Epsilon=0.642377 Action_times=4482190 Epoche=2942\n",
      "Epsilon=0.642302 Action_times=4483381 Epoche=2943\n",
      "Epsilon=0.642234 Action_times=4484453 Epoche=2944\n",
      "Epsilon=0.642166 Action_times=4485528 Epoche=2945\n",
      "Epsilon=0.642084 Action_times=4486824 Epoche=2946\n",
      "Epsilon=0.642043 Action_times=4487480 Epoche=2947\n",
      "Epsilon=0.641997 Action_times=4488197 Epoche=2948\n",
      "Epsilon=0.641957 Action_times=4488834 Epoche=2949\n",
      "Epsilon=0.641916 Action_times=4489480 Epoche=2950\n",
      "Epsilon=0.641879 Action_times=4490066 Epoche=2951\n",
      "Epsilon=0.641835 Action_times=4490767 Epoche=2952\n",
      "Epsilon=0.641800 Action_times=4491325 Epoche=2953\n",
      "Epsilon=0.641684 Action_times=4493159 Epoche=2954\n",
      "Epsilon=0.641625 Action_times=4494096 Epoche=2955\n",
      "Epsilon=0.641513 Action_times=4495857 Epoche=2956\n",
      "Epsilon=0.641332 Action_times=4498733 Epoche=2957\n",
      "Epsilon=0.641237 Action_times=4500228 Epoche=2958\n",
      "Epsilon=0.641191 Action_times=4500971 Epoche=2959\n",
      "Epsilon=0.641185 Action_times=4501054 Epoche=2960\n",
      "Epsilon=0.641129 Action_times=4501945 Epoche=2961\n",
      "Epsilon=0.641061 Action_times=4503019 Epoche=2962\n",
      "Epsilon=0.641017 Action_times=4503726 Epoche=2963\n",
      "Epsilon=0.641005 Action_times=4503908 Epoche=2964\n",
      "Epsilon=0.640944 Action_times=4504884 Epoche=2965\n",
      "Epsilon=0.640805 Action_times=4507075 Epoche=2966\n",
      "Epsilon=0.640772 Action_times=4507610 Epoche=2967\n",
      "Epsilon=0.640655 Action_times=4509461 Epoche=2968\n",
      "Epsilon=0.640608 Action_times=4510206 Epoche=2969\n",
      "Epsilon=0.640554 Action_times=4511055 Epoche=2970\n",
      "Epsilon=0.640528 Action_times=4511480 Epoche=2971\n",
      "Epsilon=0.640392 Action_times=4513628 Epoche=2972\n",
      "Epsilon=0.640318 Action_times=4514801 Epoche=2973\n",
      "Epsilon=0.640224 Action_times=4516300 Epoche=2974\n",
      "Epsilon=0.640127 Action_times=4517836 Epoche=2975\n",
      "Epsilon=0.640074 Action_times=4518674 Epoche=2976\n",
      "Epsilon=0.640036 Action_times=4519287 Epoche=2977\n",
      "Epsilon=0.639939 Action_times=4520812 Epoche=2978\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.639817 Action_times=4522763 Epoche=2979\n",
      "Epsilon=0.639809 Action_times=4522888 Epoche=2980\n",
      "Epsilon=0.639725 Action_times=4524213 Epoche=2981\n",
      "Epsilon=0.639665 Action_times=4525172 Epoche=2982\n",
      "Epsilon=0.639635 Action_times=4525646 Epoche=2983\n",
      "Epsilon=0.639578 Action_times=4526549 Epoche=2984\n",
      "Epsilon=0.639497 Action_times=4527838 Epoche=2985\n",
      "Epsilon=0.639413 Action_times=4529170 Epoche=2986\n",
      "Epsilon=0.639386 Action_times=4529598 Epoche=2987\n",
      "Epsilon=0.639253 Action_times=4531714 Epoche=2988\n",
      "Epsilon=0.639228 Action_times=4532107 Epoche=2989\n",
      "Epsilon=0.639149 Action_times=4533365 Epoche=2990\n",
      "Epsilon=0.639098 Action_times=4534177 Epoche=2991\n",
      "Epsilon=0.639037 Action_times=4535148 Epoche=2992\n",
      "Epsilon=0.638937 Action_times=4536744 Epoche=2993\n",
      "Epsilon=0.638816 Action_times=4538668 Epoche=2994\n",
      "Epsilon=0.638735 Action_times=4539953 Epoche=2995\n",
      "Epsilon=0.638695 Action_times=4540591 Epoche=2996\n",
      "Epsilon=0.638672 Action_times=4540948 Epoche=2997\n",
      "Epsilon=0.638480 Action_times=4544006 Epoche=2998\n",
      "Epsilon=0.638416 Action_times=4545029 Epoche=2999\n",
      "1\n",
      "***********************************************************\n",
      "Succeed to initialize Q-Table!\n",
      "***********************************************************\n",
      "Epsilon=0.992738 Action_times=73624 Epoche=3000\n",
      "Epsilon=0.992505 Action_times=75991 Epoche=3001\n",
      "Epsilon=0.991572 Action_times=85493 Epoche=3002\n",
      "Epsilon=0.990936 Action_times=91979 Epoche=3003\n",
      "Epsilon=0.989789 Action_times=103678 Epoche=3004\n",
      "Epsilon=0.989288 Action_times=108790 Epoche=3005\n",
      "Epsilon=0.988443 Action_times=117423 Epoche=3006\n",
      "Epsilon=0.985637 Action_times=146148 Epoche=3007\n",
      "Epsilon=0.985217 Action_times=150449 Epoche=3008\n",
      "Epsilon=0.985032 Action_times=152350 Epoche=3009\n",
      "Epsilon=0.984286 Action_times=159997 Epoche=3010\n",
      "Epsilon=0.983730 Action_times=165706 Epoche=3011\n",
      "Epsilon=0.983198 Action_times=171169 Epoche=3012\n",
      "Epsilon=0.983099 Action_times=172191 Epoche=3013\n",
      "Epsilon=0.982460 Action_times=178763 Epoche=3014\n",
      "Epsilon=0.981762 Action_times=185939 Epoche=3015\n",
      "Epsilon=0.980327 Action_times=200722 Epoche=3016\n",
      "Epsilon=0.979903 Action_times=205090 Epoche=3017\n",
      "Epsilon=0.979215 Action_times=212184 Epoche=3018\n",
      "Epsilon=0.978250 Action_times=222151 Epoche=3019\n",
      "Epsilon=0.977736 Action_times=227457 Epoche=3020\n",
      "Epsilon=0.976719 Action_times=237968 Epoche=3021\n",
      "Epsilon=0.976266 Action_times=242658 Epoche=3022\n",
      "Epsilon=0.975572 Action_times=249846 Epoche=3023\n",
      "Epsilon=0.974659 Action_times=259300 Epoche=3024\n",
      "Epsilon=0.974467 Action_times=261292 Epoche=3025\n",
      "Epsilon=0.974342 Action_times=262592 Epoche=3026\n",
      "Epsilon=0.972201 Action_times=284816 Epoche=3027\n",
      "Epsilon=0.971180 Action_times=295428 Epoche=3028\n",
      "Epsilon=0.971089 Action_times=296375 Epoche=3029\n",
      "Epsilon=0.970307 Action_times=304521 Epoche=3030\n",
      "Epsilon=0.970080 Action_times=306881 Epoche=3031\n",
      "Epsilon=0.969707 Action_times=310768 Epoche=3032\n",
      "Epsilon=0.969647 Action_times=311397 Epoche=3033\n",
      "Epsilon=0.968506 Action_times=323286 Epoche=3034\n",
      "Epsilon=0.968221 Action_times=326261 Epoche=3035\n",
      "Epsilon=0.967983 Action_times=328747 Epoche=3036\n",
      "Epsilon=0.967692 Action_times=331783 Epoche=3037\n",
      "Epsilon=0.967325 Action_times=335616 Epoche=3038\n",
      "Epsilon=0.966857 Action_times=340511 Epoche=3039\n",
      "Epsilon=0.966159 Action_times=347808 Epoche=3040\n",
      "Epsilon=0.965404 Action_times=355706 Epoche=3041\n",
      "Epsilon=0.965111 Action_times=358772 Epoche=3042\n",
      "Epsilon=0.964545 Action_times=364698 Epoche=3043\n",
      "Epsilon=0.963770 Action_times=372824 Epoche=3044\n",
      "Epsilon=0.963432 Action_times=376373 Epoche=3045\n",
      "Epsilon=0.963221 Action_times=378579 Epoche=3046\n",
      "Epsilon=0.962927 Action_times=381670 Epoche=3047\n",
      "Epsilon=0.962445 Action_times=386728 Epoche=3048\n",
      "Epsilon=0.962176 Action_times=389552 Epoche=3049\n",
      "Epsilon=0.961427 Action_times=397420 Epoche=3050\n",
      "Epsilon=0.961212 Action_times=399678 Epoche=3051\n",
      "Epsilon=0.960942 Action_times=402517 Epoche=3052\n",
      "Epsilon=0.960846 Action_times=403532 Epoche=3053\n",
      "Epsilon=0.960323 Action_times=409029 Epoche=3054\n",
      "Epsilon=0.959925 Action_times=413218 Epoche=3055\n",
      "Epsilon=0.959752 Action_times=415044 Epoche=3056\n",
      "Epsilon=0.959283 Action_times=419982 Epoche=3057\n",
      "Epsilon=0.958906 Action_times=423947 Epoche=3058\n",
      "Epsilon=0.958606 Action_times=427119 Epoche=3059\n",
      "Epsilon=0.958470 Action_times=428552 Epoche=3060\n",
      "Epsilon=0.958014 Action_times=433358 Epoche=3061\n",
      "Epsilon=0.957751 Action_times=436135 Epoche=3062\n",
      "Epsilon=0.957180 Action_times=442158 Epoche=3063\n",
      "Epsilon=0.956615 Action_times=448130 Epoche=3064\n",
      "Epsilon=0.955870 Action_times=456003 Epoche=3065\n",
      "Epsilon=0.955584 Action_times=459026 Epoche=3066\n",
      "Epsilon=0.955129 Action_times=463836 Epoche=3067\n",
      "Epsilon=0.955034 Action_times=464845 Epoche=3068\n",
      "Epsilon=0.954802 Action_times=467296 Epoche=3069\n",
      "Epsilon=0.954312 Action_times=472479 Epoche=3070\n",
      "Epsilon=0.953617 Action_times=479845 Epoche=3071\n",
      "Epsilon=0.953386 Action_times=482289 Epoche=3072\n",
      "Epsilon=0.952881 Action_times=487646 Epoche=3073\n",
      "Epsilon=0.952741 Action_times=489130 Epoche=3074\n",
      "Epsilon=0.952336 Action_times=493433 Epoche=3075\n",
      "Epsilon=0.951707 Action_times=500110 Epoche=3076\n",
      "Epsilon=0.951342 Action_times=503985 Epoche=3077\n",
      "Epsilon=0.951121 Action_times=506327 Epoche=3078\n",
      "Epsilon=0.950838 Action_times=509342 Epoche=3079\n",
      "Epsilon=0.950594 Action_times=511938 Epoche=3080\n",
      "Epsilon=0.950431 Action_times=513667 Epoche=3081\n",
      "Epsilon=0.950404 Action_times=513957 Epoche=3082\n",
      "Epsilon=0.949907 Action_times=519245 Epoche=3083\n",
      "Epsilon=0.949538 Action_times=523167 Epoche=3084\n",
      "Epsilon=0.949262 Action_times=526107 Epoche=3085\n",
      "Epsilon=0.949099 Action_times=527837 Epoche=3086\n",
      "Epsilon=0.948929 Action_times=529655 Epoche=3087\n",
      "Epsilon=0.948719 Action_times=531888 Epoche=3088\n",
      "Epsilon=0.948341 Action_times=535911 Epoche=3089\n",
      "Epsilon=0.947921 Action_times=540393 Epoche=3090\n",
      "Epsilon=0.947532 Action_times=544539 Epoche=3091\n",
      "Epsilon=0.947349 Action_times=546489 Epoche=3092\n",
      "Epsilon=0.947315 Action_times=546854 Epoche=3093\n",
      "Epsilon=0.946828 Action_times=552057 Epoche=3094\n",
      "Epsilon=0.946679 Action_times=553642 Epoche=3095\n",
      "Epsilon=0.946259 Action_times=558127 Epoche=3096\n",
      "Epsilon=0.945940 Action_times=561531 Epoche=3097\n",
      "Epsilon=0.945506 Action_times=566172 Epoche=3098\n",
      "Epsilon=0.945214 Action_times=569297 Epoche=3099\n",
      "Epsilon=0.945133 Action_times=570158 Epoche=3100\n",
      "Epsilon=0.944789 Action_times=573842 Epoche=3101\n",
      "Epsilon=0.944537 Action_times=576541 Epoche=3102\n",
      "Epsilon=0.944083 Action_times=581400 Epoche=3103\n",
      "Epsilon=0.943803 Action_times=584396 Epoche=3104\n",
      "Epsilon=0.943785 Action_times=584592 Epoche=3105\n",
      "Epsilon=0.943579 Action_times=586795 Epoche=3106\n",
      "Epsilon=0.943274 Action_times=590065 Epoche=3107\n",
      "Epsilon=0.943163 Action_times=591250 Epoche=3108\n",
      "Epsilon=0.942120 Action_times=602437 Epoche=3109\n",
      "Epsilon=0.941613 Action_times=607876 Epoche=3110\n",
      "Epsilon=0.941498 Action_times=609106 Epoche=3111\n",
      "Epsilon=0.941395 Action_times=610214 Epoche=3112\n",
      "Epsilon=0.940698 Action_times=617705 Epoche=3113\n",
      "Epsilon=0.940604 Action_times=618712 Epoche=3114\n",
      "Epsilon=0.940451 Action_times=620351 Epoche=3115\n",
      "Epsilon=0.940191 Action_times=623153 Epoche=3116\n",
      "Epsilon=0.940085 Action_times=624294 Epoche=3117\n",
      "Epsilon=0.939680 Action_times=628646 Epoche=3118\n",
      "Epsilon=0.939560 Action_times=629933 Epoche=3119\n",
      "Epsilon=0.939483 Action_times=630763 Epoche=3120\n",
      "Epsilon=0.939079 Action_times=635111 Epoche=3121\n",
      "Epsilon=0.938810 Action_times=638009 Epoche=3122\n",
      "Epsilon=0.938664 Action_times=639576 Epoche=3123\n",
      "Epsilon=0.938655 Action_times=639676 Epoche=3124\n",
      "Epsilon=0.938591 Action_times=640361 Epoche=3125\n",
      "Epsilon=0.938407 Action_times=642351 Epoche=3126\n",
      "Epsilon=0.938136 Action_times=645265 Epoche=3127\n",
      "Epsilon=0.937862 Action_times=648224 Epoche=3128\n",
      "Epsilon=0.937246 Action_times=654862 Epoche=3129\n",
      "Epsilon=0.937154 Action_times=655850 Epoche=3130\n",
      "Epsilon=0.936752 Action_times=660190 Epoche=3131\n",
      "Epsilon=0.936709 Action_times=660656 Epoche=3132\n",
      "Epsilon=0.936450 Action_times=663454 Epoche=3133\n",
      "Epsilon=0.936317 Action_times=664885 Epoche=3134\n",
      "Epsilon=0.936209 Action_times=666054 Epoche=3135\n",
      "Epsilon=0.936166 Action_times=666514 Epoche=3136\n",
      "Epsilon=0.936045 Action_times=667821 Epoche=3137\n",
      "Epsilon=0.935555 Action_times=673109 Epoche=3138\n",
      "Epsilon=0.935124 Action_times=677772 Epoche=3139\n",
      "Epsilon=0.935044 Action_times=678632 Epoche=3140\n",
      "Epsilon=0.934913 Action_times=680054 Epoche=3141\n",
      "Epsilon=0.934442 Action_times=685141 Epoche=3142\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.933957 Action_times=690399 Epoche=3143\n",
      "Epsilon=0.933761 Action_times=692513 Epoche=3144\n",
      "Epsilon=0.933603 Action_times=694231 Epoche=3145\n",
      "Epsilon=0.933442 Action_times=695971 Epoche=3146\n",
      "Epsilon=0.933127 Action_times=699378 Epoche=3147\n",
      "Epsilon=0.932737 Action_times=703603 Epoche=3148\n",
      "Epsilon=0.932372 Action_times=707561 Epoche=3149\n",
      "Epsilon=0.932280 Action_times=708561 Epoche=3150\n",
      "Epsilon=0.932146 Action_times=710012 Epoche=3151\n",
      "Epsilon=0.932002 Action_times=711571 Epoche=3152\n",
      "Epsilon=0.931940 Action_times=712248 Epoche=3153\n",
      "Epsilon=0.931718 Action_times=714654 Epoche=3154\n",
      "Epsilon=0.931372 Action_times=718406 Epoche=3155\n",
      "Epsilon=0.931099 Action_times=721372 Epoche=3156\n",
      "Epsilon=0.931042 Action_times=721991 Epoche=3157\n",
      "Epsilon=0.930715 Action_times=725546 Epoche=3158\n",
      "Epsilon=0.930443 Action_times=728502 Epoche=3159\n",
      "Epsilon=0.930273 Action_times=730344 Epoche=3160\n",
      "Epsilon=0.930272 Action_times=730360 Epoche=3161\n",
      "Epsilon=0.930247 Action_times=730633 Epoche=3162\n",
      "Epsilon=0.930242 Action_times=730686 Epoche=3163\n",
      "Epsilon=0.930022 Action_times=733070 Epoche=3164\n",
      "Epsilon=0.929716 Action_times=736395 Epoche=3165\n",
      "Epsilon=0.929350 Action_times=740385 Epoche=3166\n",
      "Epsilon=0.929096 Action_times=743141 Epoche=3167\n",
      "Epsilon=0.928916 Action_times=745105 Epoche=3168\n",
      "Epsilon=0.928635 Action_times=748162 Epoche=3169\n",
      "Epsilon=0.928519 Action_times=749427 Epoche=3170\n",
      "Epsilon=0.928343 Action_times=751343 Epoche=3171\n",
      "Epsilon=0.927669 Action_times=758683 Epoche=3172\n",
      "Epsilon=0.927386 Action_times=761762 Epoche=3173\n",
      "Epsilon=0.927119 Action_times=764673 Epoche=3174\n",
      "Epsilon=0.926932 Action_times=766720 Epoche=3175\n",
      "Epsilon=0.926783 Action_times=768343 Epoche=3176\n",
      "Epsilon=0.926649 Action_times=769805 Epoche=3177\n",
      "Epsilon=0.926587 Action_times=770481 Epoche=3178\n",
      "Epsilon=0.926476 Action_times=771691 Epoche=3179\n",
      "Epsilon=0.926011 Action_times=776770 Epoche=3180\n",
      "Epsilon=0.925877 Action_times=778230 Epoche=3181\n",
      "Epsilon=0.925829 Action_times=778748 Epoche=3182\n",
      "Epsilon=0.925523 Action_times=782096 Epoche=3183\n",
      "Epsilon=0.925265 Action_times=784915 Epoche=3184\n",
      "Epsilon=0.925107 Action_times=786635 Epoche=3185\n",
      "Epsilon=0.925056 Action_times=787200 Epoche=3186\n",
      "Epsilon=0.924813 Action_times=789856 Epoche=3187\n",
      "Epsilon=0.924791 Action_times=790097 Epoche=3188\n",
      "Epsilon=0.924466 Action_times=793644 Epoche=3189\n",
      "Epsilon=0.924422 Action_times=794132 Epoche=3190\n",
      "Epsilon=0.924334 Action_times=795086 Epoche=3191\n",
      "Epsilon=0.924135 Action_times=797262 Epoche=3192\n",
      "Epsilon=0.923768 Action_times=801285 Epoche=3193\n",
      "Epsilon=0.923704 Action_times=801982 Epoche=3194\n",
      "Epsilon=0.923700 Action_times=802022 Epoche=3195\n",
      "Epsilon=0.923548 Action_times=803686 Epoche=3196\n",
      "Epsilon=0.923037 Action_times=809287 Epoche=3197\n",
      "Epsilon=0.922617 Action_times=813883 Epoche=3198\n",
      "Epsilon=0.922348 Action_times=816839 Epoche=3199\n",
      "Epsilon=0.922329 Action_times=817043 Epoche=3200\n",
      "Epsilon=0.922097 Action_times=819588 Epoche=3201\n",
      "Epsilon=0.921798 Action_times=822861 Epoche=3202\n",
      "Epsilon=0.921566 Action_times=825410 Epoche=3203\n",
      "Epsilon=0.921373 Action_times=827523 Epoche=3204\n",
      "Epsilon=0.921192 Action_times=829510 Epoche=3205\n",
      "Epsilon=0.920881 Action_times=832924 Epoche=3206\n",
      "Epsilon=0.920737 Action_times=834513 Epoche=3207\n",
      "Epsilon=0.920605 Action_times=835955 Epoche=3208\n",
      "Epsilon=0.920443 Action_times=837731 Epoche=3209\n",
      "Epsilon=0.920325 Action_times=839031 Epoche=3210\n",
      "Epsilon=0.920221 Action_times=840174 Epoche=3211\n",
      "Epsilon=0.920081 Action_times=841710 Epoche=3212\n",
      "Epsilon=0.919982 Action_times=842805 Epoche=3213\n",
      "Epsilon=0.919812 Action_times=844665 Epoche=3214\n",
      "Epsilon=0.919686 Action_times=846051 Epoche=3215\n",
      "Epsilon=0.919476 Action_times=848363 Epoche=3216\n",
      "Epsilon=0.919293 Action_times=850378 Epoche=3217\n",
      "Epsilon=0.918821 Action_times=855568 Epoche=3218\n",
      "Epsilon=0.918521 Action_times=858869 Epoche=3219\n",
      "Epsilon=0.918404 Action_times=860158 Epoche=3220\n",
      "Epsilon=0.918307 Action_times=861223 Epoche=3221\n",
      "Epsilon=0.918100 Action_times=863503 Epoche=3222\n",
      "Epsilon=0.917970 Action_times=864938 Epoche=3223\n",
      "Epsilon=0.917802 Action_times=866792 Epoche=3224\n",
      "Epsilon=0.917695 Action_times=867966 Epoche=3225\n",
      "Epsilon=0.917441 Action_times=870763 Epoche=3226\n",
      "Epsilon=0.917311 Action_times=872201 Epoche=3227\n",
      "Epsilon=0.917073 Action_times=874817 Epoche=3228\n",
      "Epsilon=0.916819 Action_times=877619 Epoche=3229\n",
      "Epsilon=0.916684 Action_times=879108 Epoche=3230\n",
      "Epsilon=0.916173 Action_times=884742 Epoche=3231\n",
      "Epsilon=0.915780 Action_times=889080 Epoche=3232\n",
      "Epsilon=0.915684 Action_times=890148 Epoche=3233\n",
      "Epsilon=0.915511 Action_times=892050 Epoche=3234\n",
      "Epsilon=0.915371 Action_times=893605 Epoche=3235\n",
      "Epsilon=0.915205 Action_times=895439 Epoche=3236\n",
      "Epsilon=0.915055 Action_times=897095 Epoche=3237\n",
      "Epsilon=0.914940 Action_times=898358 Epoche=3238\n",
      "Epsilon=0.914710 Action_times=900909 Epoche=3239\n",
      "Epsilon=0.914436 Action_times=903938 Epoche=3240\n",
      "Epsilon=0.914185 Action_times=906715 Epoche=3241\n",
      "Epsilon=0.914087 Action_times=907796 Epoche=3242\n",
      "Epsilon=0.913881 Action_times=910071 Epoche=3243\n",
      "Epsilon=0.913469 Action_times=914633 Epoche=3244\n",
      "Epsilon=0.913253 Action_times=917020 Epoche=3245\n",
      "Epsilon=0.913102 Action_times=918695 Epoche=3246\n",
      "Epsilon=0.912972 Action_times=920135 Epoche=3247\n",
      "Epsilon=0.912904 Action_times=920885 Epoche=3248\n",
      "Epsilon=0.912715 Action_times=922980 Epoche=3249\n",
      "Epsilon=0.912386 Action_times=926623 Epoche=3250\n",
      "Epsilon=0.912276 Action_times=927846 Epoche=3251\n",
      "Epsilon=0.911993 Action_times=930980 Epoche=3252\n",
      "Epsilon=0.911836 Action_times=932722 Epoche=3253\n",
      "Epsilon=0.911704 Action_times=934183 Epoche=3254\n",
      "Epsilon=0.911602 Action_times=935315 Epoche=3255\n",
      "Epsilon=0.911420 Action_times=937341 Epoche=3256\n",
      "Epsilon=0.911255 Action_times=939169 Epoche=3257\n",
      "Epsilon=0.911035 Action_times=941607 Epoche=3258\n",
      "Epsilon=0.910797 Action_times=944245 Epoche=3259\n",
      "Epsilon=0.910689 Action_times=945451 Epoche=3260\n",
      "Epsilon=0.910252 Action_times=950300 Epoche=3261\n",
      "Epsilon=0.909918 Action_times=954011 Epoche=3262\n",
      "Epsilon=0.909797 Action_times=955357 Epoche=3263\n",
      "Epsilon=0.909644 Action_times=957053 Epoche=3264\n",
      "Epsilon=0.909620 Action_times=957323 Epoche=3265\n",
      "Epsilon=0.909409 Action_times=959673 Epoche=3266\n",
      "Epsilon=0.909247 Action_times=961474 Epoche=3267\n",
      "Epsilon=0.909111 Action_times=962979 Epoche=3268\n",
      "Epsilon=0.908732 Action_times=967205 Epoche=3269\n",
      "Epsilon=0.908664 Action_times=967955 Epoche=3270\n",
      "Epsilon=0.908447 Action_times=970375 Epoche=3271\n",
      "Epsilon=0.908306 Action_times=971938 Epoche=3272\n",
      "Epsilon=0.908124 Action_times=973967 Epoche=3273\n",
      "Epsilon=0.907925 Action_times=976181 Epoche=3274\n",
      "Epsilon=0.907802 Action_times=977558 Epoche=3275\n",
      "Epsilon=0.907620 Action_times=979586 Epoche=3276\n",
      "Epsilon=0.907595 Action_times=979860 Epoche=3277\n",
      "Epsilon=0.907289 Action_times=983271 Epoche=3278\n",
      "Epsilon=0.906899 Action_times=987618 Epoche=3279\n",
      "Epsilon=0.906580 Action_times=991173 Epoche=3280\n",
      "Epsilon=0.906499 Action_times=992079 Epoche=3281\n",
      "Epsilon=0.906375 Action_times=993466 Epoche=3282\n",
      "Epsilon=0.906053 Action_times=997056 Epoche=3283\n",
      "Epsilon=0.905944 Action_times=998273 Epoche=3284\n",
      "Epsilon=0.905691 Action_times=1001091 Epoche=3285\n",
      "Epsilon=0.905436 Action_times=1003937 Epoche=3286\n",
      "Epsilon=0.905388 Action_times=1004476 Epoche=3287\n",
      "Epsilon=0.905181 Action_times=1006794 Epoche=3288\n",
      "Epsilon=0.905129 Action_times=1007367 Epoche=3289\n",
      "Epsilon=0.905110 Action_times=1007587 Epoche=3290\n",
      "Epsilon=0.904965 Action_times=1009208 Epoche=3291\n",
      "Epsilon=0.904708 Action_times=1012077 Epoche=3292\n",
      "Epsilon=0.904610 Action_times=1013170 Epoche=3293\n",
      "Epsilon=0.904519 Action_times=1014192 Epoche=3294\n",
      "Epsilon=0.904255 Action_times=1017139 Epoche=3295\n",
      "Epsilon=0.904144 Action_times=1018379 Epoche=3296\n",
      "Epsilon=0.904100 Action_times=1018868 Epoche=3297\n",
      "Epsilon=0.903855 Action_times=1021612 Epoche=3298\n",
      "Epsilon=0.903822 Action_times=1021979 Epoche=3299\n",
      "Epsilon=0.903703 Action_times=1023316 Epoche=3300\n",
      "Epsilon=0.903477 Action_times=1025847 Epoche=3301\n",
      "Epsilon=0.903319 Action_times=1027616 Epoche=3302\n",
      "Epsilon=0.903299 Action_times=1027834 Epoche=3303\n",
      "Epsilon=0.903092 Action_times=1030149 Epoche=3304\n",
      "Epsilon=0.902890 Action_times=1032416 Epoche=3305\n",
      "Epsilon=0.902808 Action_times=1033332 Epoche=3306\n",
      "Epsilon=0.902284 Action_times=1039205 Epoche=3307\n",
      "Epsilon=0.902087 Action_times=1041410 Epoche=3308\n",
      "Epsilon=0.901832 Action_times=1044267 Epoche=3309\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.901789 Action_times=1044754 Epoche=3310\n",
      "Epsilon=0.901618 Action_times=1046673 Epoche=3311\n",
      "Epsilon=0.901411 Action_times=1048990 Epoche=3312\n",
      "Epsilon=0.901211 Action_times=1051235 Epoche=3313\n",
      "Epsilon=0.901056 Action_times=1052975 Epoche=3314\n",
      "Epsilon=0.900880 Action_times=1054948 Epoche=3315\n",
      "Epsilon=0.900494 Action_times=1059284 Epoche=3316\n",
      "Epsilon=0.900444 Action_times=1059849 Epoche=3317\n",
      "Epsilon=0.900363 Action_times=1060752 Epoche=3318\n",
      "Epsilon=0.900168 Action_times=1062942 Epoche=3319\n",
      "Epsilon=0.899967 Action_times=1065206 Epoche=3320\n",
      "Epsilon=0.899880 Action_times=1066184 Epoche=3321\n",
      "Epsilon=0.899748 Action_times=1067670 Epoche=3322\n",
      "Epsilon=0.899431 Action_times=1071228 Epoche=3323\n",
      "Epsilon=0.899246 Action_times=1073315 Epoche=3324\n",
      "Epsilon=0.898858 Action_times=1077674 Epoche=3325\n",
      "Epsilon=0.898853 Action_times=1077734 Epoche=3326\n",
      "Epsilon=0.898550 Action_times=1081135 Epoche=3327\n",
      "Epsilon=0.898258 Action_times=1084424 Epoche=3328\n",
      "Epsilon=0.898057 Action_times=1086690 Epoche=3329\n",
      "Epsilon=0.897555 Action_times=1092348 Epoche=3330\n",
      "Epsilon=0.897416 Action_times=1093916 Epoche=3331\n",
      "Epsilon=0.897396 Action_times=1094139 Epoche=3332\n",
      "Epsilon=0.897371 Action_times=1094419 Epoche=3333\n",
      "Epsilon=0.897181 Action_times=1096561 Epoche=3334\n",
      "Epsilon=0.896793 Action_times=1100938 Epoche=3335\n",
      "Epsilon=0.896718 Action_times=1101782 Epoche=3336\n",
      "Epsilon=0.896624 Action_times=1102837 Epoche=3337\n",
      "Epsilon=0.896537 Action_times=1103819 Epoche=3338\n",
      "Epsilon=0.896258 Action_times=1106968 Epoche=3339\n",
      "Epsilon=0.896005 Action_times=1109819 Epoche=3340\n",
      "Epsilon=0.895710 Action_times=1113151 Epoche=3341\n",
      "Epsilon=0.895445 Action_times=1116148 Epoche=3342\n",
      "Epsilon=0.895435 Action_times=1116255 Epoche=3343\n",
      "Epsilon=0.895251 Action_times=1118337 Epoche=3344\n",
      "Epsilon=0.895048 Action_times=1120634 Epoche=3345\n",
      "Epsilon=0.894886 Action_times=1122456 Epoche=3346\n",
      "Epsilon=0.894832 Action_times=1123075 Epoche=3347\n",
      "Epsilon=0.894551 Action_times=1126249 Epoche=3348\n",
      "Epsilon=0.894452 Action_times=1127369 Epoche=3349\n",
      "Epsilon=0.894327 Action_times=1128785 Epoche=3350\n",
      "Epsilon=0.894132 Action_times=1130989 Epoche=3351\n",
      "Epsilon=0.893981 Action_times=1132699 Epoche=3352\n",
      "Epsilon=0.893943 Action_times=1133129 Epoche=3353\n",
      "Epsilon=0.893914 Action_times=1133457 Epoche=3354\n",
      "Epsilon=0.893698 Action_times=1135899 Epoche=3355\n",
      "Epsilon=0.893391 Action_times=1139372 Epoche=3356\n",
      "Epsilon=0.893034 Action_times=1143412 Epoche=3357\n",
      "Epsilon=0.892822 Action_times=1145817 Epoche=3358\n",
      "Epsilon=0.892566 Action_times=1148714 Epoche=3359\n",
      "Epsilon=0.892363 Action_times=1151019 Epoche=3360\n",
      "Epsilon=0.892160 Action_times=1153313 Epoche=3361\n",
      "Epsilon=0.891938 Action_times=1155837 Epoche=3362\n",
      "Epsilon=0.891892 Action_times=1156350 Epoche=3363\n",
      "Epsilon=0.891784 Action_times=1157582 Epoche=3364\n",
      "Epsilon=0.891608 Action_times=1159570 Epoche=3365\n",
      "Epsilon=0.891440 Action_times=1161485 Epoche=3366\n",
      "Epsilon=0.891199 Action_times=1164211 Epoche=3367\n",
      "Epsilon=0.891047 Action_times=1165937 Epoche=3368\n",
      "Epsilon=0.890737 Action_times=1169454 Epoche=3369\n",
      "Epsilon=0.890617 Action_times=1170825 Epoche=3370\n",
      "Epsilon=0.890435 Action_times=1172889 Epoche=3371\n",
      "Epsilon=0.890212 Action_times=1175417 Epoche=3372\n",
      "Epsilon=0.890185 Action_times=1175733 Epoche=3373\n",
      "Epsilon=0.890078 Action_times=1176949 Epoche=3374\n",
      "Epsilon=0.889721 Action_times=1181004 Epoche=3375\n",
      "Epsilon=0.889588 Action_times=1182511 Epoche=3376\n",
      "Epsilon=0.889449 Action_times=1184093 Epoche=3377\n",
      "Epsilon=0.889355 Action_times=1185168 Epoche=3378\n",
      "Epsilon=0.889285 Action_times=1185962 Epoche=3379\n",
      "Epsilon=0.889187 Action_times=1187069 Epoche=3380\n",
      "Epsilon=0.889007 Action_times=1189121 Epoche=3381\n",
      "Epsilon=0.888841 Action_times=1191014 Epoche=3382\n",
      "Epsilon=0.888741 Action_times=1192152 Epoche=3383\n",
      "Epsilon=0.888646 Action_times=1193229 Epoche=3384\n",
      "Epsilon=0.888455 Action_times=1195399 Epoche=3385\n",
      "Epsilon=0.888206 Action_times=1198240 Epoche=3386\n",
      "Epsilon=0.888107 Action_times=1199368 Epoche=3387\n",
      "Epsilon=0.887943 Action_times=1201238 Epoche=3388\n",
      "Epsilon=0.887807 Action_times=1202782 Epoche=3389\n",
      "Epsilon=0.887554 Action_times=1205669 Epoche=3390\n",
      "Epsilon=0.887423 Action_times=1207159 Epoche=3391\n",
      "Epsilon=0.887212 Action_times=1209559 Epoche=3392\n",
      "Epsilon=0.886959 Action_times=1212442 Epoche=3393\n",
      "Epsilon=0.886807 Action_times=1214186 Epoche=3394\n",
      "Epsilon=0.886629 Action_times=1216207 Epoche=3395\n",
      "Epsilon=0.886516 Action_times=1217495 Epoche=3396\n",
      "Epsilon=0.886338 Action_times=1219536 Epoche=3397\n",
      "Epsilon=0.886276 Action_times=1220241 Epoche=3398\n",
      "Epsilon=0.886080 Action_times=1222476 Epoche=3399\n",
      "Epsilon=0.885988 Action_times=1223523 Epoche=3400\n",
      "Epsilon=0.885814 Action_times=1225515 Epoche=3401\n",
      "Epsilon=0.885654 Action_times=1227334 Epoche=3402\n",
      "Epsilon=0.885505 Action_times=1229046 Epoche=3403\n",
      "Epsilon=0.885460 Action_times=1229556 Epoche=3404\n",
      "Epsilon=0.885358 Action_times=1230722 Epoche=3405\n",
      "Epsilon=0.885059 Action_times=1234133 Epoche=3406\n",
      "Epsilon=0.885038 Action_times=1234376 Epoche=3407\n",
      "Epsilon=0.884831 Action_times=1236737 Epoche=3408\n",
      "Epsilon=0.884708 Action_times=1238148 Epoche=3409\n",
      "Epsilon=0.884658 Action_times=1238725 Epoche=3410\n",
      "Epsilon=0.884594 Action_times=1239456 Epoche=3411\n",
      "Epsilon=0.884292 Action_times=1242900 Epoche=3412\n",
      "Epsilon=0.884134 Action_times=1244710 Epoche=3413\n",
      "Epsilon=0.883929 Action_times=1247055 Epoche=3414\n",
      "Epsilon=0.883842 Action_times=1248054 Epoche=3415\n",
      "Epsilon=0.883798 Action_times=1248560 Epoche=3416\n",
      "Epsilon=0.883614 Action_times=1250662 Epoche=3417\n",
      "Epsilon=0.883543 Action_times=1251479 Epoche=3418\n",
      "Epsilon=0.883404 Action_times=1253068 Epoche=3419\n",
      "Epsilon=0.883222 Action_times=1255146 Epoche=3420\n",
      "Epsilon=0.883193 Action_times=1255487 Epoche=3421\n",
      "Epsilon=0.882811 Action_times=1259859 Epoche=3422\n",
      "Epsilon=0.882567 Action_times=1262658 Epoche=3423\n",
      "Epsilon=0.882338 Action_times=1265278 Epoche=3424\n",
      "Epsilon=0.882140 Action_times=1267547 Epoche=3425\n",
      "Epsilon=0.882060 Action_times=1268468 Epoche=3426\n",
      "Epsilon=0.881681 Action_times=1272812 Epoche=3427\n",
      "Epsilon=0.881504 Action_times=1274847 Epoche=3428\n",
      "Epsilon=0.881385 Action_times=1276214 Epoche=3429\n",
      "Epsilon=0.881345 Action_times=1276667 Epoche=3430\n",
      "Epsilon=0.881258 Action_times=1277667 Epoche=3431\n",
      "Epsilon=0.881239 Action_times=1277885 Epoche=3432\n",
      "Epsilon=0.881070 Action_times=1279830 Epoche=3433\n",
      "Epsilon=0.880789 Action_times=1283055 Epoche=3434\n",
      "Epsilon=0.880758 Action_times=1283414 Epoche=3435\n",
      "Epsilon=0.880619 Action_times=1285006 Epoche=3436\n",
      "Epsilon=0.880374 Action_times=1287820 Epoche=3437\n",
      "Epsilon=0.880211 Action_times=1289692 Epoche=3438\n",
      "Epsilon=0.880197 Action_times=1289850 Epoche=3439\n",
      "Epsilon=0.880063 Action_times=1291392 Epoche=3440\n",
      "Epsilon=0.879863 Action_times=1293694 Epoche=3441\n",
      "Epsilon=0.879647 Action_times=1296178 Epoche=3442\n",
      "Epsilon=0.879428 Action_times=1298689 Epoche=3443\n",
      "Epsilon=0.879170 Action_times=1301661 Epoche=3444\n",
      "Epsilon=0.878958 Action_times=1304099 Epoche=3445\n",
      "Epsilon=0.878899 Action_times=1304778 Epoche=3446\n",
      "Epsilon=0.878463 Action_times=1309801 Epoche=3447\n",
      "Epsilon=0.878441 Action_times=1310050 Epoche=3448\n",
      "Epsilon=0.878269 Action_times=1312032 Epoche=3449\n",
      "Epsilon=0.878134 Action_times=1313583 Epoche=3450\n",
      "Epsilon=0.877852 Action_times=1316833 Epoche=3451\n",
      "Epsilon=0.877775 Action_times=1317721 Epoche=3452\n",
      "Epsilon=0.877459 Action_times=1321368 Epoche=3453\n",
      "Epsilon=0.877399 Action_times=1322063 Epoche=3454\n",
      "Epsilon=0.877259 Action_times=1323671 Epoche=3455\n",
      "Epsilon=0.877087 Action_times=1325651 Epoche=3456\n",
      "Epsilon=0.876793 Action_times=1329044 Epoche=3457\n",
      "Epsilon=0.876761 Action_times=1329417 Epoche=3458\n",
      "Epsilon=0.876613 Action_times=1331121 Epoche=3459\n",
      "Epsilon=0.876485 Action_times=1332606 Epoche=3460\n",
      "Epsilon=0.876372 Action_times=1333906 Epoche=3461\n",
      "Epsilon=0.876212 Action_times=1335754 Epoche=3462\n",
      "Epsilon=0.876061 Action_times=1337496 Epoche=3463\n",
      "Epsilon=0.875839 Action_times=1340055 Epoche=3464\n",
      "Epsilon=0.875661 Action_times=1342116 Epoche=3465\n",
      "Epsilon=0.875585 Action_times=1342998 Epoche=3466\n",
      "Epsilon=0.875426 Action_times=1344825 Epoche=3467\n",
      "Epsilon=0.875235 Action_times=1347042 Epoche=3468\n",
      "Epsilon=0.875007 Action_times=1349677 Epoche=3469\n",
      "Epsilon=0.874721 Action_times=1352985 Epoche=3470\n",
      "Epsilon=0.874457 Action_times=1356032 Epoche=3471\n",
      "Epsilon=0.874066 Action_times=1360555 Epoche=3472\n",
      "Epsilon=0.874038 Action_times=1360882 Epoche=3473\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.873999 Action_times=1361334 Epoche=3474\n",
      "Epsilon=0.873873 Action_times=1362793 Epoche=3475\n",
      "Epsilon=0.873716 Action_times=1364610 Epoche=3476\n",
      "Epsilon=0.873623 Action_times=1365686 Epoche=3477\n",
      "Epsilon=0.873451 Action_times=1367681 Epoche=3478\n",
      "Epsilon=0.873200 Action_times=1370584 Epoche=3479\n",
      "Epsilon=0.873137 Action_times=1371315 Epoche=3480\n",
      "Epsilon=0.873025 Action_times=1372614 Epoche=3481\n",
      "Epsilon=0.872855 Action_times=1374584 Epoche=3482\n",
      "Epsilon=0.872640 Action_times=1377076 Epoche=3483\n",
      "Epsilon=0.872459 Action_times=1379171 Epoche=3484\n",
      "Epsilon=0.872313 Action_times=1380869 Epoche=3485\n",
      "Epsilon=0.872218 Action_times=1381966 Epoche=3486\n",
      "Epsilon=0.872028 Action_times=1384169 Epoche=3487\n",
      "Epsilon=0.871997 Action_times=1384533 Epoche=3488\n",
      "Epsilon=0.871901 Action_times=1385645 Epoche=3489\n",
      "Epsilon=0.871519 Action_times=1390080 Epoche=3490\n",
      "Epsilon=0.871372 Action_times=1391785 Epoche=3491\n",
      "Epsilon=0.871350 Action_times=1392042 Epoche=3492\n",
      "Epsilon=0.871244 Action_times=1393276 Epoche=3493\n",
      "Epsilon=0.871150 Action_times=1394364 Epoche=3494\n",
      "Epsilon=0.870972 Action_times=1396433 Epoche=3495\n",
      "Epsilon=0.870697 Action_times=1399622 Epoche=3496\n",
      "Epsilon=0.870565 Action_times=1401156 Epoche=3497\n",
      "Epsilon=0.870529 Action_times=1401574 Epoche=3498\n",
      "Epsilon=0.870344 Action_times=1403730 Epoche=3499\n",
      "Epsilon=0.870156 Action_times=1405906 Epoche=3500\n",
      "Epsilon=0.870080 Action_times=1406790 Epoche=3501\n",
      "Epsilon=0.869921 Action_times=1408641 Epoche=3502\n",
      "Epsilon=0.869798 Action_times=1410080 Epoche=3503\n",
      "Epsilon=0.869723 Action_times=1410942 Epoche=3504\n",
      "Epsilon=0.869535 Action_times=1413130 Epoche=3505\n",
      "Epsilon=0.869368 Action_times=1415082 Epoche=3506\n",
      "Epsilon=0.869278 Action_times=1416126 Epoche=3507\n",
      "Epsilon=0.869021 Action_times=1419113 Epoche=3508\n",
      "Epsilon=0.868862 Action_times=1420971 Epoche=3509\n",
      "Epsilon=0.868499 Action_times=1425189 Epoche=3510\n",
      "Epsilon=0.868361 Action_times=1426799 Epoche=3511\n",
      "Epsilon=0.868234 Action_times=1428283 Epoche=3512\n",
      "Epsilon=0.868002 Action_times=1430983 Epoche=3513\n",
      "Epsilon=0.867878 Action_times=1432435 Epoche=3514\n",
      "Epsilon=0.867506 Action_times=1436770 Epoche=3515\n",
      "Epsilon=0.867425 Action_times=1437718 Epoche=3516\n",
      "Epsilon=0.867359 Action_times=1438481 Epoche=3517\n",
      "Epsilon=0.867309 Action_times=1439065 Epoche=3518\n",
      "Epsilon=0.867220 Action_times=1440099 Epoche=3519\n",
      "Epsilon=0.867172 Action_times=1440665 Epoche=3520\n",
      "Epsilon=0.866920 Action_times=1443603 Epoche=3521\n",
      "Epsilon=0.866798 Action_times=1445028 Epoche=3522\n",
      "Epsilon=0.866677 Action_times=1446438 Epoche=3523\n",
      "Epsilon=0.866533 Action_times=1448125 Epoche=3524\n",
      "Epsilon=0.866417 Action_times=1449476 Epoche=3525\n",
      "Epsilon=0.866243 Action_times=1451508 Epoche=3526\n",
      "Epsilon=0.866137 Action_times=1452749 Epoche=3527\n",
      "Epsilon=0.865953 Action_times=1454896 Epoche=3528\n",
      "Epsilon=0.865723 Action_times=1457583 Epoche=3529\n",
      "Epsilon=0.865595 Action_times=1459077 Epoche=3530\n",
      "Epsilon=0.865406 Action_times=1461283 Epoche=3531\n",
      "Epsilon=0.865241 Action_times=1463214 Epoche=3532\n",
      "Epsilon=0.864936 Action_times=1466784 Epoche=3533\n",
      "Epsilon=0.864808 Action_times=1468278 Epoche=3534\n",
      "Epsilon=0.864584 Action_times=1470898 Epoche=3535\n",
      "Epsilon=0.864394 Action_times=1473126 Epoche=3536\n",
      "Epsilon=0.864301 Action_times=1474211 Epoche=3537\n",
      "Epsilon=0.864109 Action_times=1476458 Epoche=3538\n",
      "Epsilon=0.863913 Action_times=1478755 Epoche=3539\n",
      "Epsilon=0.863790 Action_times=1480194 Epoche=3540\n",
      "Epsilon=0.863631 Action_times=1482060 Epoche=3541\n",
      "Epsilon=0.863398 Action_times=1484793 Epoche=3542\n",
      "Epsilon=0.863193 Action_times=1487193 Epoche=3543\n",
      "Epsilon=0.863164 Action_times=1487536 Epoche=3544\n",
      "Epsilon=0.863057 Action_times=1488785 Epoche=3545\n",
      "Epsilon=0.863000 Action_times=1489458 Epoche=3546\n",
      "Epsilon=0.862958 Action_times=1489941 Epoche=3547\n",
      "Epsilon=0.862828 Action_times=1491467 Epoche=3548\n",
      "Epsilon=0.862642 Action_times=1493653 Epoche=3549\n",
      "Epsilon=0.862512 Action_times=1495181 Epoche=3550\n",
      "Epsilon=0.862378 Action_times=1496743 Epoche=3551\n",
      "Epsilon=0.862320 Action_times=1497432 Epoche=3552\n",
      "Epsilon=0.862215 Action_times=1498656 Epoche=3553\n",
      "Epsilon=0.862088 Action_times=1500156 Epoche=3554\n",
      "Epsilon=0.862041 Action_times=1500707 Epoche=3555\n",
      "Epsilon=0.861931 Action_times=1501995 Epoche=3556\n",
      "Epsilon=0.861854 Action_times=1502899 Epoche=3557\n",
      "Epsilon=0.861792 Action_times=1503629 Epoche=3558\n",
      "Epsilon=0.861689 Action_times=1504838 Epoche=3559\n",
      "Epsilon=0.861580 Action_times=1506119 Epoche=3560\n",
      "Epsilon=0.861514 Action_times=1506885 Epoche=3561\n",
      "Epsilon=0.861476 Action_times=1507331 Epoche=3562\n",
      "Epsilon=0.861284 Action_times=1509596 Epoche=3563\n",
      "Epsilon=0.861223 Action_times=1510305 Epoche=3564\n",
      "Epsilon=0.861189 Action_times=1510704 Epoche=3565\n",
      "Epsilon=0.861102 Action_times=1511733 Epoche=3566\n",
      "Epsilon=0.861009 Action_times=1512825 Epoche=3567\n",
      "Epsilon=0.860901 Action_times=1514097 Epoche=3568\n",
      "Epsilon=0.860730 Action_times=1516105 Epoche=3569\n",
      "Epsilon=0.860685 Action_times=1516630 Epoche=3570\n",
      "Epsilon=0.860570 Action_times=1517977 Epoche=3571\n",
      "Epsilon=0.860457 Action_times=1519315 Epoche=3572\n",
      "Epsilon=0.860373 Action_times=1520293 Epoche=3573\n",
      "Epsilon=0.860322 Action_times=1520895 Epoche=3574\n",
      "Epsilon=0.860267 Action_times=1521540 Epoche=3575\n",
      "Epsilon=0.860234 Action_times=1521934 Epoche=3576\n",
      "Epsilon=0.860102 Action_times=1523482 Epoche=3577\n",
      "Epsilon=0.859963 Action_times=1525120 Epoche=3578\n",
      "Epsilon=0.859914 Action_times=1525698 Epoche=3579\n",
      "Epsilon=0.859754 Action_times=1527579 Epoche=3580\n",
      "Epsilon=0.859702 Action_times=1528187 Epoche=3581\n",
      "Epsilon=0.859581 Action_times=1529622 Epoche=3582\n",
      "Epsilon=0.859339 Action_times=1532460 Epoche=3583\n",
      "Epsilon=0.859202 Action_times=1534084 Epoche=3584\n",
      "Epsilon=0.859095 Action_times=1535339 Epoche=3585\n",
      "Epsilon=0.858953 Action_times=1537013 Epoche=3586\n",
      "Epsilon=0.858759 Action_times=1539295 Epoche=3587\n",
      "Epsilon=0.858578 Action_times=1541435 Epoche=3588\n",
      "Epsilon=0.858479 Action_times=1542599 Epoche=3589\n",
      "Epsilon=0.858367 Action_times=1543919 Epoche=3590\n",
      "Epsilon=0.858169 Action_times=1546250 Epoche=3591\n",
      "Epsilon=0.858095 Action_times=1547122 Epoche=3592\n",
      "Epsilon=0.857957 Action_times=1548753 Epoche=3593\n",
      "Epsilon=0.857931 Action_times=1549060 Epoche=3594\n",
      "Epsilon=0.857699 Action_times=1551799 Epoche=3595\n",
      "Epsilon=0.857655 Action_times=1552308 Epoche=3596\n",
      "Epsilon=0.857534 Action_times=1553742 Epoche=3597\n",
      "Epsilon=0.857285 Action_times=1556684 Epoche=3598\n",
      "Epsilon=0.857267 Action_times=1556886 Epoche=3599\n",
      "Epsilon=0.857094 Action_times=1558929 Epoche=3600\n",
      "Epsilon=0.856853 Action_times=1561776 Epoche=3601\n",
      "Epsilon=0.856673 Action_times=1563909 Epoche=3602\n",
      "Epsilon=0.856516 Action_times=1565758 Epoche=3603\n",
      "Epsilon=0.856382 Action_times=1567347 Epoche=3604\n",
      "Epsilon=0.856147 Action_times=1570116 Epoche=3605\n",
      "Epsilon=0.856081 Action_times=1570902 Epoche=3606\n",
      "Epsilon=0.855956 Action_times=1572371 Epoche=3607\n",
      "Epsilon=0.855768 Action_times=1574595 Epoche=3608\n",
      "Epsilon=0.855658 Action_times=1575900 Epoche=3609\n",
      "Epsilon=0.855579 Action_times=1576830 Epoche=3610\n",
      "Epsilon=0.855492 Action_times=1577864 Epoche=3611\n",
      "Epsilon=0.855127 Action_times=1582177 Epoche=3612\n",
      "Epsilon=0.855028 Action_times=1583356 Epoche=3613\n",
      "Epsilon=0.854855 Action_times=1585404 Epoche=3614\n",
      "Epsilon=0.854808 Action_times=1585956 Epoche=3615\n",
      "Epsilon=0.854511 Action_times=1589473 Epoche=3616\n",
      "Epsilon=0.854192 Action_times=1593244 Epoche=3617\n",
      "Epsilon=0.854026 Action_times=1595217 Epoche=3618\n",
      "Epsilon=0.853838 Action_times=1597448 Epoche=3619\n",
      "Epsilon=0.853693 Action_times=1599167 Epoche=3620\n",
      "Epsilon=0.853424 Action_times=1602355 Epoche=3621\n",
      "Epsilon=0.853315 Action_times=1603642 Epoche=3622\n",
      "Epsilon=0.853136 Action_times=1605764 Epoche=3623\n",
      "Epsilon=0.852998 Action_times=1607405 Epoche=3624\n",
      "Epsilon=0.852898 Action_times=1608587 Epoche=3625\n",
      "Epsilon=0.852774 Action_times=1610058 Epoche=3626\n",
      "Epsilon=0.852503 Action_times=1613276 Epoche=3627\n",
      "Epsilon=0.852433 Action_times=1614110 Epoche=3628\n",
      "Epsilon=0.852380 Action_times=1614737 Epoche=3629\n",
      "Epsilon=0.852274 Action_times=1615993 Epoche=3630\n",
      "Epsilon=0.852167 Action_times=1617268 Epoche=3631\n",
      "Epsilon=0.852109 Action_times=1617950 Epoche=3632\n",
      "Epsilon=0.851947 Action_times=1619873 Epoche=3633\n",
      "Epsilon=0.851879 Action_times=1620682 Epoche=3634\n",
      "Epsilon=0.851650 Action_times=1623402 Epoche=3635\n",
      "Epsilon=0.851613 Action_times=1623846 Epoche=3636\n",
      "Epsilon=0.851474 Action_times=1625494 Epoche=3637\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.851380 Action_times=1626613 Epoche=3638\n",
      "Epsilon=0.851224 Action_times=1628464 Epoche=3639\n",
      "Epsilon=0.851109 Action_times=1629837 Epoche=3640\n",
      "Epsilon=0.850957 Action_times=1631644 Epoche=3641\n",
      "Epsilon=0.850777 Action_times=1633781 Epoche=3642\n",
      "Epsilon=0.850685 Action_times=1634881 Epoche=3643\n",
      "Epsilon=0.850584 Action_times=1636084 Epoche=3644\n",
      "Epsilon=0.850452 Action_times=1637652 Epoche=3645\n",
      "Epsilon=0.850076 Action_times=1642129 Epoche=3646\n",
      "Epsilon=0.849844 Action_times=1644884 Epoche=3647\n",
      "Epsilon=0.849625 Action_times=1647490 Epoche=3648\n",
      "Epsilon=0.849558 Action_times=1648297 Epoche=3649\n",
      "Epsilon=0.849467 Action_times=1649373 Epoche=3650\n",
      "Epsilon=0.849349 Action_times=1650779 Epoche=3651\n",
      "Epsilon=0.849212 Action_times=1652414 Epoche=3652\n",
      "Epsilon=0.849165 Action_times=1652981 Epoche=3653\n",
      "Epsilon=0.848929 Action_times=1655791 Epoche=3654\n",
      "Epsilon=0.848891 Action_times=1656237 Epoche=3655\n",
      "Epsilon=0.848763 Action_times=1657767 Epoche=3656\n",
      "Epsilon=0.848574 Action_times=1660018 Epoche=3657\n",
      "Epsilon=0.848469 Action_times=1661270 Epoche=3658\n",
      "Epsilon=0.848324 Action_times=1663003 Epoche=3659\n",
      "Epsilon=0.848239 Action_times=1664019 Epoche=3660\n",
      "Epsilon=0.848020 Action_times=1666627 Epoche=3661\n",
      "Epsilon=0.847902 Action_times=1668033 Epoche=3662\n",
      "Epsilon=0.847836 Action_times=1668827 Epoche=3663\n",
      "Epsilon=0.847700 Action_times=1670454 Epoche=3664\n",
      "Epsilon=0.847591 Action_times=1671753 Epoche=3665\n",
      "Epsilon=0.847444 Action_times=1673507 Epoche=3666\n",
      "Epsilon=0.847268 Action_times=1675603 Epoche=3667\n",
      "Epsilon=0.847106 Action_times=1677543 Epoche=3668\n",
      "Epsilon=0.847048 Action_times=1678238 Epoche=3669\n",
      "Epsilon=0.846535 Action_times=1684365 Epoche=3670\n",
      "Epsilon=0.846452 Action_times=1685362 Epoche=3671\n",
      "Epsilon=0.846346 Action_times=1686621 Epoche=3672\n",
      "Epsilon=0.846291 Action_times=1687280 Epoche=3673\n",
      "Epsilon=0.846123 Action_times=1689292 Epoche=3674\n",
      "Epsilon=0.846017 Action_times=1690561 Epoche=3675\n",
      "Epsilon=0.845719 Action_times=1694121 Epoche=3676\n",
      "Epsilon=0.845514 Action_times=1696582 Epoche=3677\n",
      "Epsilon=0.845319 Action_times=1698912 Epoche=3678\n",
      "Epsilon=0.845311 Action_times=1699007 Epoche=3679\n",
      "Epsilon=0.845051 Action_times=1702116 Epoche=3680\n",
      "Epsilon=0.844886 Action_times=1704095 Epoche=3681\n",
      "Epsilon=0.844529 Action_times=1708376 Epoche=3682\n",
      "Epsilon=0.844482 Action_times=1708943 Epoche=3683\n",
      "Epsilon=0.844298 Action_times=1711139 Epoche=3684\n",
      "Epsilon=0.843950 Action_times=1715317 Epoche=3685\n",
      "Epsilon=0.843945 Action_times=1715370 Epoche=3686\n",
      "Epsilon=0.843937 Action_times=1715469 Epoche=3687\n",
      "Epsilon=0.843922 Action_times=1715646 Epoche=3688\n",
      "Epsilon=0.843672 Action_times=1718645 Epoche=3689\n",
      "Epsilon=0.843620 Action_times=1719275 Epoche=3690\n",
      "Epsilon=0.843579 Action_times=1719767 Epoche=3691\n",
      "Epsilon=0.843521 Action_times=1720465 Epoche=3692\n",
      "Epsilon=0.843370 Action_times=1722276 Epoche=3693\n",
      "Epsilon=0.843212 Action_times=1724163 Epoche=3694\n",
      "Epsilon=0.843146 Action_times=1724962 Epoche=3695\n",
      "Epsilon=0.843062 Action_times=1725963 Epoche=3696\n",
      "Epsilon=0.842807 Action_times=1729032 Epoche=3697\n",
      "Epsilon=0.842748 Action_times=1729740 Epoche=3698\n",
      "Epsilon=0.842692 Action_times=1730411 Epoche=3699\n",
      "Epsilon=0.842477 Action_times=1732990 Epoche=3700\n",
      "Epsilon=0.842424 Action_times=1733636 Epoche=3701\n",
      "Epsilon=0.842366 Action_times=1734324 Epoche=3702\n",
      "Epsilon=0.842256 Action_times=1735645 Epoche=3703\n",
      "Epsilon=0.842054 Action_times=1738077 Epoche=3704\n",
      "Epsilon=0.841984 Action_times=1738913 Epoche=3705\n",
      "Epsilon=0.841970 Action_times=1739091 Epoche=3706\n",
      "Epsilon=0.841830 Action_times=1740765 Epoche=3707\n",
      "Epsilon=0.841783 Action_times=1741328 Epoche=3708\n",
      "Epsilon=0.841612 Action_times=1743395 Epoche=3709\n",
      "Epsilon=0.841496 Action_times=1744789 Epoche=3710\n",
      "Epsilon=0.841283 Action_times=1747343 Epoche=3711\n",
      "Epsilon=0.841234 Action_times=1747938 Epoche=3712\n",
      "Epsilon=0.841120 Action_times=1749307 Epoche=3713\n",
      "Epsilon=0.841050 Action_times=1750151 Epoche=3714\n",
      "Epsilon=0.840813 Action_times=1753004 Epoche=3715\n",
      "Epsilon=0.840674 Action_times=1754677 Epoche=3716\n",
      "Epsilon=0.840588 Action_times=1755707 Epoche=3717\n",
      "Epsilon=0.840564 Action_times=1756002 Epoche=3718\n",
      "Epsilon=0.840460 Action_times=1757251 Epoche=3719\n",
      "Epsilon=0.840315 Action_times=1758993 Epoche=3720\n",
      "Epsilon=0.840253 Action_times=1759740 Epoche=3721\n",
      "Epsilon=0.840167 Action_times=1760786 Epoche=3722\n",
      "Epsilon=0.840086 Action_times=1761762 Epoche=3723\n",
      "Epsilon=0.839963 Action_times=1763238 Epoche=3724\n",
      "Epsilon=0.839839 Action_times=1764736 Epoche=3725\n",
      "Epsilon=0.839795 Action_times=1765259 Epoche=3726\n",
      "Epsilon=0.839749 Action_times=1765812 Epoche=3727\n",
      "Epsilon=0.839527 Action_times=1768488 Epoche=3728\n",
      "Epsilon=0.839378 Action_times=1770284 Epoche=3729\n",
      "Epsilon=0.839332 Action_times=1770848 Epoche=3730\n",
      "Epsilon=0.839192 Action_times=1772529 Epoche=3731\n",
      "Epsilon=0.839082 Action_times=1773859 Epoche=3732\n",
      "Epsilon=0.838995 Action_times=1774912 Epoche=3733\n",
      "Epsilon=0.838928 Action_times=1775717 Epoche=3734\n",
      "Epsilon=0.838896 Action_times=1776107 Epoche=3735\n",
      "Epsilon=0.838741 Action_times=1777970 Epoche=3736\n",
      "Epsilon=0.838551 Action_times=1780267 Epoche=3737\n",
      "Epsilon=0.838459 Action_times=1781380 Epoche=3738\n",
      "Epsilon=0.838374 Action_times=1782402 Epoche=3739\n",
      "Epsilon=0.838266 Action_times=1783710 Epoche=3740\n",
      "Epsilon=0.838192 Action_times=1784599 Epoche=3741\n",
      "Epsilon=0.838059 Action_times=1786205 Epoche=3742\n",
      "Epsilon=0.837963 Action_times=1787366 Epoche=3743\n",
      "Epsilon=0.837905 Action_times=1788065 Epoche=3744\n",
      "Epsilon=0.837706 Action_times=1790475 Epoche=3745\n",
      "Epsilon=0.837489 Action_times=1793087 Epoche=3746\n",
      "Epsilon=0.837313 Action_times=1795219 Epoche=3747\n",
      "Epsilon=0.837187 Action_times=1796744 Epoche=3748\n",
      "Epsilon=0.837122 Action_times=1797529 Epoche=3749\n",
      "Epsilon=0.837022 Action_times=1798740 Epoche=3750\n",
      "Epsilon=0.836784 Action_times=1801618 Epoche=3751\n",
      "Epsilon=0.836710 Action_times=1802515 Epoche=3752\n",
      "Epsilon=0.836559 Action_times=1804339 Epoche=3753\n",
      "Epsilon=0.836508 Action_times=1804951 Epoche=3754\n",
      "Epsilon=0.836402 Action_times=1806240 Epoche=3755\n",
      "Epsilon=0.836329 Action_times=1807124 Epoche=3756\n",
      "Epsilon=0.836295 Action_times=1807530 Epoche=3757\n",
      "Epsilon=0.836232 Action_times=1808289 Epoche=3758\n",
      "Epsilon=0.836218 Action_times=1808463 Epoche=3759\n",
      "Epsilon=0.836141 Action_times=1809391 Epoche=3760\n",
      "Epsilon=0.836123 Action_times=1809612 Epoche=3761\n",
      "Epsilon=0.835925 Action_times=1812015 Epoche=3762\n",
      "Epsilon=0.835825 Action_times=1813224 Epoche=3763\n",
      "Epsilon=0.835737 Action_times=1814292 Epoche=3764\n",
      "Epsilon=0.835580 Action_times=1816183 Epoche=3765\n",
      "Epsilon=0.835349 Action_times=1818986 Epoche=3766\n",
      "Epsilon=0.835098 Action_times=1822031 Epoche=3767\n",
      "Epsilon=0.834908 Action_times=1824333 Epoche=3768\n",
      "Epsilon=0.834812 Action_times=1825496 Epoche=3769\n",
      "Epsilon=0.834749 Action_times=1826256 Epoche=3770\n",
      "Epsilon=0.834706 Action_times=1826777 Epoche=3771\n",
      "Epsilon=0.834626 Action_times=1827751 Epoche=3772\n",
      "Epsilon=0.834483 Action_times=1829485 Epoche=3773\n",
      "Epsilon=0.834411 Action_times=1830356 Epoche=3774\n",
      "Epsilon=0.834360 Action_times=1830976 Epoche=3775\n",
      "Epsilon=0.834293 Action_times=1831793 Epoche=3776\n",
      "Epsilon=0.834200 Action_times=1832916 Epoche=3777\n",
      "Epsilon=0.833960 Action_times=1835830 Epoche=3778\n",
      "Epsilon=0.833825 Action_times=1837470 Epoche=3779\n",
      "Epsilon=0.833692 Action_times=1839084 Epoche=3780\n",
      "Epsilon=0.833663 Action_times=1839432 Epoche=3781\n",
      "Epsilon=0.833416 Action_times=1842431 Epoche=3782\n",
      "Epsilon=0.833221 Action_times=1844804 Epoche=3783\n",
      "Epsilon=0.833026 Action_times=1847177 Epoche=3784\n",
      "Epsilon=0.832954 Action_times=1848044 Epoche=3785\n",
      "Epsilon=0.832776 Action_times=1850206 Epoche=3786\n",
      "Epsilon=0.832729 Action_times=1850776 Epoche=3787\n",
      "Epsilon=0.832592 Action_times=1852443 Epoche=3788\n",
      "Epsilon=0.832549 Action_times=1852969 Epoche=3789\n",
      "Epsilon=0.832449 Action_times=1854182 Epoche=3790\n",
      "Epsilon=0.832191 Action_times=1857321 Epoche=3791\n",
      "Epsilon=0.831926 Action_times=1860544 Epoche=3792\n",
      "Epsilon=0.831872 Action_times=1861199 Epoche=3793\n",
      "Epsilon=0.831612 Action_times=1864362 Epoche=3794\n",
      "Epsilon=0.831505 Action_times=1865672 Epoche=3795\n",
      "Epsilon=0.831230 Action_times=1869023 Epoche=3796\n",
      "Epsilon=0.831150 Action_times=1869995 Epoche=3797\n",
      "Epsilon=0.830961 Action_times=1872296 Epoche=3798\n",
      "Epsilon=0.830781 Action_times=1874486 Epoche=3799\n",
      "Epsilon=0.830679 Action_times=1875726 Epoche=3800\n",
      "Epsilon=0.830567 Action_times=1877092 Epoche=3801\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.830515 Action_times=1877728 Epoche=3802\n",
      "Epsilon=0.830479 Action_times=1878162 Epoche=3803\n",
      "Epsilon=0.830436 Action_times=1878691 Epoche=3804\n",
      "Epsilon=0.830347 Action_times=1879771 Epoche=3805\n",
      "Epsilon=0.830336 Action_times=1879911 Epoche=3806\n",
      "Epsilon=0.830170 Action_times=1881937 Epoche=3807\n",
      "Epsilon=0.830157 Action_times=1882096 Epoche=3808\n",
      "Epsilon=0.830028 Action_times=1883668 Epoche=3809\n",
      "Epsilon=0.829952 Action_times=1884595 Epoche=3810\n",
      "Epsilon=0.829908 Action_times=1885129 Epoche=3811\n",
      "Epsilon=0.829732 Action_times=1887279 Epoche=3812\n",
      "Epsilon=0.829503 Action_times=1890073 Epoche=3813\n",
      "Epsilon=0.829410 Action_times=1891202 Epoche=3814\n",
      "Epsilon=0.829324 Action_times=1892256 Epoche=3815\n",
      "Epsilon=0.829250 Action_times=1893156 Epoche=3816\n",
      "Epsilon=0.829168 Action_times=1894162 Epoche=3817\n",
      "Epsilon=0.829064 Action_times=1895431 Epoche=3818\n",
      "Epsilon=0.828975 Action_times=1896514 Epoche=3819\n",
      "Epsilon=0.828889 Action_times=1897565 Epoche=3820\n",
      "Epsilon=0.828773 Action_times=1898975 Epoche=3821\n",
      "Epsilon=0.828666 Action_times=1900286 Epoche=3822\n",
      "Epsilon=0.828608 Action_times=1900994 Epoche=3823\n",
      "Epsilon=0.828443 Action_times=1903008 Epoche=3824\n",
      "Epsilon=0.828369 Action_times=1903911 Epoche=3825\n",
      "Epsilon=0.828354 Action_times=1904104 Epoche=3826\n",
      "Epsilon=0.828106 Action_times=1907133 Epoche=3827\n",
      "Epsilon=0.828084 Action_times=1907396 Epoche=3828\n",
      "Epsilon=0.827869 Action_times=1910030 Epoche=3829\n",
      "Epsilon=0.827688 Action_times=1912245 Epoche=3830\n",
      "Epsilon=0.827572 Action_times=1913657 Epoche=3831\n",
      "Epsilon=0.827392 Action_times=1915864 Epoche=3832\n",
      "Epsilon=0.827136 Action_times=1918996 Epoche=3833\n",
      "Epsilon=0.826924 Action_times=1921583 Epoche=3834\n",
      "Epsilon=0.826735 Action_times=1923904 Epoche=3835\n",
      "Epsilon=0.826419 Action_times=1927773 Epoche=3836\n",
      "Epsilon=0.826354 Action_times=1928569 Epoche=3837\n",
      "Epsilon=0.826314 Action_times=1929064 Epoche=3838\n",
      "Epsilon=0.826227 Action_times=1930121 Epoche=3839\n",
      "Epsilon=0.825957 Action_times=1933436 Epoche=3840\n",
      "Epsilon=0.825580 Action_times=1938057 Epoche=3841\n",
      "Epsilon=0.825479 Action_times=1939287 Epoche=3842\n",
      "Epsilon=0.825379 Action_times=1940516 Epoche=3843\n",
      "Epsilon=0.825258 Action_times=1942001 Epoche=3844\n",
      "Epsilon=0.825192 Action_times=1942815 Epoche=3845\n",
      "Epsilon=0.825170 Action_times=1943087 Epoche=3846\n",
      "Epsilon=0.825044 Action_times=1944627 Epoche=3847\n",
      "Epsilon=0.825010 Action_times=1945049 Epoche=3848\n",
      "Epsilon=0.824989 Action_times=1945302 Epoche=3849\n",
      "Epsilon=0.824909 Action_times=1946282 Epoche=3850\n",
      "Epsilon=0.824772 Action_times=1947962 Epoche=3851\n",
      "Epsilon=0.824539 Action_times=1950831 Epoche=3852\n",
      "Epsilon=0.824431 Action_times=1952155 Epoche=3853\n",
      "Epsilon=0.824253 Action_times=1954343 Epoche=3854\n",
      "Epsilon=0.824068 Action_times=1956614 Epoche=3855\n",
      "Epsilon=0.823929 Action_times=1958319 Epoche=3856\n",
      "Epsilon=0.823889 Action_times=1958804 Epoche=3857\n",
      "Epsilon=0.823817 Action_times=1959696 Epoche=3858\n",
      "Epsilon=0.823746 Action_times=1960564 Epoche=3859\n",
      "Epsilon=0.823603 Action_times=1962328 Epoche=3860\n",
      "Epsilon=0.823547 Action_times=1963011 Epoche=3861\n",
      "Epsilon=0.823532 Action_times=1963201 Epoche=3862\n",
      "Epsilon=0.823438 Action_times=1964358 Epoche=3863\n",
      "Epsilon=0.823411 Action_times=1964682 Epoche=3864\n",
      "Epsilon=0.823322 Action_times=1965783 Epoche=3865\n",
      "Epsilon=0.823157 Action_times=1967813 Epoche=3866\n",
      "Epsilon=0.822896 Action_times=1971018 Epoche=3867\n",
      "Epsilon=0.822813 Action_times=1972035 Epoche=3868\n",
      "Epsilon=0.822692 Action_times=1973522 Epoche=3869\n",
      "Epsilon=0.822523 Action_times=1975610 Epoche=3870\n",
      "Epsilon=0.822319 Action_times=1978116 Epoche=3871\n",
      "Epsilon=0.822203 Action_times=1979543 Epoche=3872\n",
      "Epsilon=0.821959 Action_times=1982555 Epoche=3873\n",
      "Epsilon=0.821714 Action_times=1985566 Epoche=3874\n",
      "Epsilon=0.821530 Action_times=1987838 Epoche=3875\n",
      "Epsilon=0.821457 Action_times=1988740 Epoche=3876\n",
      "Epsilon=0.821286 Action_times=1990837 Epoche=3877\n",
      "Epsilon=0.821154 Action_times=1992469 Epoche=3878\n",
      "Epsilon=0.820987 Action_times=1994530 Epoche=3879\n",
      "Epsilon=0.820863 Action_times=1996061 Epoche=3880\n",
      "Epsilon=0.820764 Action_times=1997285 Epoche=3881\n",
      "Epsilon=0.820627 Action_times=1998970 Epoche=3882\n",
      "Epsilon=0.820502 Action_times=2000506 Epoche=3883\n",
      "Epsilon=0.820401 Action_times=2001755 Epoche=3884\n",
      "Epsilon=0.820198 Action_times=2004261 Epoche=3885\n",
      "Epsilon=0.819982 Action_times=2006925 Epoche=3886\n",
      "Epsilon=0.819810 Action_times=2009051 Epoche=3887\n",
      "Epsilon=0.819787 Action_times=2009335 Epoche=3888\n",
      "Epsilon=0.819659 Action_times=2010915 Epoche=3889\n",
      "Epsilon=0.819431 Action_times=2013729 Epoche=3890\n",
      "Epsilon=0.819350 Action_times=2014731 Epoche=3891\n",
      "Epsilon=0.819167 Action_times=2017000 Epoche=3892\n",
      "Epsilon=0.818945 Action_times=2019735 Epoche=3893\n",
      "Epsilon=0.818812 Action_times=2021390 Epoche=3894\n",
      "Epsilon=0.818683 Action_times=2022975 Epoche=3895\n",
      "Epsilon=0.818556 Action_times=2024549 Epoche=3896\n",
      "Epsilon=0.818454 Action_times=2025816 Epoche=3897\n",
      "Epsilon=0.818362 Action_times=2026951 Epoche=3898\n",
      "Epsilon=0.818298 Action_times=2027739 Epoche=3899\n",
      "Epsilon=0.818263 Action_times=2028177 Epoche=3900\n",
      "Epsilon=0.818221 Action_times=2028695 Epoche=3901\n",
      "Epsilon=0.818098 Action_times=2030217 Epoche=3902\n",
      "Epsilon=0.818027 Action_times=2031089 Epoche=3903\n",
      "Epsilon=0.817872 Action_times=2033016 Epoche=3904\n",
      "Epsilon=0.817819 Action_times=2033669 Epoche=3905\n",
      "Epsilon=0.817732 Action_times=2034741 Epoche=3906\n",
      "Epsilon=0.817608 Action_times=2036286 Epoche=3907\n",
      "Epsilon=0.817568 Action_times=2036771 Epoche=3908\n",
      "Epsilon=0.817411 Action_times=2038723 Epoche=3909\n",
      "Epsilon=0.817309 Action_times=2039983 Epoche=3910\n",
      "Epsilon=0.817222 Action_times=2041057 Epoche=3911\n",
      "Epsilon=0.817127 Action_times=2042245 Epoche=3912\n",
      "Epsilon=0.817005 Action_times=2043745 Epoche=3913\n",
      "Epsilon=0.816702 Action_times=2047511 Epoche=3914\n",
      "Epsilon=0.816527 Action_times=2049681 Epoche=3915\n",
      "Epsilon=0.816475 Action_times=2050317 Epoche=3916\n",
      "Epsilon=0.816313 Action_times=2052326 Epoche=3917\n",
      "Epsilon=0.816289 Action_times=2052633 Epoche=3918\n",
      "Epsilon=0.816175 Action_times=2054038 Epoche=3919\n",
      "Epsilon=0.816050 Action_times=2055591 Epoche=3920\n",
      "Epsilon=0.816022 Action_times=2055934 Epoche=3921\n",
      "Epsilon=0.815963 Action_times=2056676 Epoche=3922\n",
      "Epsilon=0.815924 Action_times=2057154 Epoche=3923\n",
      "Epsilon=0.815848 Action_times=2058093 Epoche=3924\n",
      "Epsilon=0.815760 Action_times=2059186 Epoche=3925\n",
      "Epsilon=0.815679 Action_times=2060193 Epoche=3926\n",
      "Epsilon=0.815554 Action_times=2061742 Epoche=3927\n",
      "Epsilon=0.815484 Action_times=2062620 Epoche=3928\n",
      "Epsilon=0.815413 Action_times=2063493 Epoche=3929\n",
      "Epsilon=0.815341 Action_times=2064394 Epoche=3930\n",
      "Epsilon=0.815304 Action_times=2064847 Epoche=3931\n",
      "Epsilon=0.815289 Action_times=2065039 Epoche=3932\n",
      "Epsilon=0.815248 Action_times=2065544 Epoche=3933\n",
      "Epsilon=0.815220 Action_times=2065889 Epoche=3934\n",
      "Epsilon=0.815184 Action_times=2066338 Epoche=3935\n",
      "Epsilon=0.815071 Action_times=2067745 Epoche=3936\n",
      "Epsilon=0.814772 Action_times=2071461 Epoche=3937\n",
      "Epsilon=0.814402 Action_times=2076052 Epoche=3938\n",
      "Epsilon=0.814264 Action_times=2077768 Epoche=3939\n",
      "Epsilon=0.814226 Action_times=2078245 Epoche=3940\n",
      "Epsilon=0.814080 Action_times=2080058 Epoche=3941\n",
      "Epsilon=0.813660 Action_times=2085288 Epoche=3942\n",
      "Epsilon=0.813542 Action_times=2086754 Epoche=3943\n",
      "Epsilon=0.813323 Action_times=2089480 Epoche=3944\n",
      "Epsilon=0.813263 Action_times=2090224 Epoche=3945\n",
      "Epsilon=0.813155 Action_times=2091571 Epoche=3946\n",
      "Epsilon=0.813081 Action_times=2092488 Epoche=3947\n",
      "Epsilon=0.812987 Action_times=2093662 Epoche=3948\n",
      "Epsilon=0.812885 Action_times=2094939 Epoche=3949\n",
      "Epsilon=0.812795 Action_times=2096052 Epoche=3950\n",
      "Epsilon=0.812588 Action_times=2098632 Epoche=3951\n",
      "Epsilon=0.812458 Action_times=2100253 Epoche=3952\n",
      "Epsilon=0.812418 Action_times=2100752 Epoche=3953\n",
      "Epsilon=0.812324 Action_times=2101919 Epoche=3954\n",
      "Epsilon=0.812291 Action_times=2102331 Epoche=3955\n",
      "Epsilon=0.812046 Action_times=2105395 Epoche=3956\n",
      "Epsilon=0.811788 Action_times=2108611 Epoche=3957\n",
      "Epsilon=0.811566 Action_times=2111372 Epoche=3958\n",
      "Epsilon=0.811550 Action_times=2111577 Epoche=3959\n",
      "Epsilon=0.811386 Action_times=2113617 Epoche=3960\n",
      "Epsilon=0.811227 Action_times=2115608 Epoche=3961\n",
      "Epsilon=0.811081 Action_times=2117424 Epoche=3962\n",
      "Epsilon=0.810998 Action_times=2118461 Epoche=3963\n",
      "Epsilon=0.810966 Action_times=2118866 Epoche=3964\n",
      "Epsilon=0.810899 Action_times=2119698 Epoche=3965\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.810848 Action_times=2120341 Epoche=3966\n",
      "Epsilon=0.810804 Action_times=2120886 Epoche=3967\n",
      "Epsilon=0.810695 Action_times=2122243 Epoche=3968\n",
      "Epsilon=0.810597 Action_times=2123473 Epoche=3969\n",
      "Epsilon=0.810566 Action_times=2123862 Epoche=3970\n",
      "Epsilon=0.810544 Action_times=2124129 Epoche=3971\n",
      "Epsilon=0.810432 Action_times=2125538 Epoche=3972\n",
      "Epsilon=0.810351 Action_times=2126544 Epoche=3973\n",
      "Epsilon=0.810041 Action_times=2130425 Epoche=3974\n",
      "Epsilon=0.809872 Action_times=2132532 Epoche=3975\n",
      "Epsilon=0.809706 Action_times=2134609 Epoche=3976\n",
      "Epsilon=0.809616 Action_times=2135731 Epoche=3977\n",
      "Epsilon=0.809539 Action_times=2136699 Epoche=3978\n",
      "Epsilon=0.809462 Action_times=2137656 Epoche=3979\n",
      "Epsilon=0.809421 Action_times=2138177 Epoche=3980\n",
      "Epsilon=0.809327 Action_times=2139342 Epoche=3981\n",
      "Epsilon=0.809293 Action_times=2139770 Epoche=3982\n",
      "Epsilon=0.809258 Action_times=2140212 Epoche=3983\n",
      "Epsilon=0.809237 Action_times=2140476 Epoche=3984\n",
      "Epsilon=0.809118 Action_times=2141958 Epoche=3985\n",
      "Epsilon=0.808984 Action_times=2143636 Epoche=3986\n",
      "Epsilon=0.808902 Action_times=2144672 Epoche=3987\n",
      "Epsilon=0.808760 Action_times=2146446 Epoche=3988\n",
      "Epsilon=0.808590 Action_times=2148576 Epoche=3989\n",
      "Epsilon=0.808579 Action_times=2148705 Epoche=3990\n",
      "Epsilon=0.808478 Action_times=2149979 Epoche=3991\n",
      "Epsilon=0.808448 Action_times=2150350 Epoche=3992\n",
      "Epsilon=0.808340 Action_times=2151705 Epoche=3993\n",
      "Epsilon=0.808204 Action_times=2153413 Epoche=3994\n",
      "Epsilon=0.808161 Action_times=2153949 Epoche=3995\n",
      "Epsilon=0.808080 Action_times=2154967 Epoche=3996\n",
      "Epsilon=0.807829 Action_times=2158110 Epoche=3997\n",
      "Epsilon=0.807682 Action_times=2159950 Epoche=3998\n",
      "Epsilon=0.807444 Action_times=2162931 Epoche=3999\n",
      "Epsilon=0.807424 Action_times=2163179 Epoche=4000\n",
      "Epsilon=0.807306 Action_times=2164669 Epoche=4001\n",
      "Epsilon=0.807257 Action_times=2165284 Epoche=4002\n",
      "Epsilon=0.807122 Action_times=2166976 Epoche=4003\n",
      "Epsilon=0.807100 Action_times=2167247 Epoche=4004\n",
      "Epsilon=0.807034 Action_times=2168072 Epoche=4005\n",
      "Epsilon=0.807022 Action_times=2168229 Epoche=4006\n",
      "Epsilon=0.806795 Action_times=2171076 Epoche=4007\n",
      "Epsilon=0.806687 Action_times=2172433 Epoche=4008\n",
      "Epsilon=0.806634 Action_times=2173090 Epoche=4009\n",
      "Epsilon=0.806603 Action_times=2173482 Epoche=4010\n",
      "Epsilon=0.806472 Action_times=2175129 Epoche=4011\n",
      "Epsilon=0.806335 Action_times=2176847 Epoche=4012\n",
      "Epsilon=0.806314 Action_times=2177118 Epoche=4013\n",
      "Epsilon=0.806001 Action_times=2181049 Epoche=4014\n",
      "Epsilon=0.805945 Action_times=2181744 Epoche=4015\n",
      "Epsilon=0.805891 Action_times=2182431 Epoche=4016\n",
      "Epsilon=0.805750 Action_times=2184200 Epoche=4017\n",
      "Epsilon=0.805713 Action_times=2184667 Epoche=4018\n",
      "Epsilon=0.805685 Action_times=2185019 Epoche=4019\n",
      "Epsilon=0.805629 Action_times=2185717 Epoche=4020\n",
      "Epsilon=0.805569 Action_times=2186473 Epoche=4021\n",
      "Epsilon=0.805498 Action_times=2187369 Epoche=4022\n",
      "Epsilon=0.805486 Action_times=2187511 Epoche=4023\n",
      "Epsilon=0.805431 Action_times=2188207 Epoche=4024\n",
      "Epsilon=0.805179 Action_times=2191378 Epoche=4025\n",
      "Epsilon=0.805087 Action_times=2192534 Epoche=4026\n",
      "Epsilon=0.805039 Action_times=2193137 Epoche=4027\n",
      "Epsilon=0.804964 Action_times=2194086 Epoche=4028\n",
      "Epsilon=0.804833 Action_times=2195723 Epoche=4029\n",
      "Epsilon=0.804720 Action_times=2197149 Epoche=4030\n",
      "Epsilon=0.804538 Action_times=2199436 Epoche=4031\n",
      "Epsilon=0.804482 Action_times=2200143 Epoche=4032\n",
      "Epsilon=0.804282 Action_times=2202660 Epoche=4033\n",
      "Epsilon=0.804046 Action_times=2205638 Epoche=4034\n",
      "Epsilon=0.803939 Action_times=2206989 Epoche=4035\n",
      "Epsilon=0.803839 Action_times=2208238 Epoche=4036\n",
      "Epsilon=0.803614 Action_times=2211082 Epoche=4037\n",
      "Epsilon=0.803539 Action_times=2212017 Epoche=4038\n",
      "Epsilon=0.803473 Action_times=2212858 Epoche=4039\n",
      "Epsilon=0.803341 Action_times=2214515 Epoche=4040\n",
      "Epsilon=0.803307 Action_times=2214948 Epoche=4041\n",
      "Epsilon=0.803241 Action_times=2215779 Epoche=4042\n",
      "Epsilon=0.803114 Action_times=2217386 Epoche=4043\n",
      "Epsilon=0.802983 Action_times=2219035 Epoche=4044\n",
      "Epsilon=0.802828 Action_times=2220987 Epoche=4045\n",
      "Epsilon=0.802759 Action_times=2221857 Epoche=4046\n",
      "Epsilon=0.802560 Action_times=2224367 Epoche=4047\n",
      "Epsilon=0.802364 Action_times=2226835 Epoche=4048\n",
      "Epsilon=0.802278 Action_times=2227926 Epoche=4049\n",
      "Epsilon=0.802157 Action_times=2229449 Epoche=4050\n",
      "Epsilon=0.801989 Action_times=2231575 Epoche=4051\n",
      "Epsilon=0.801824 Action_times=2233661 Epoche=4052\n",
      "Epsilon=0.801672 Action_times=2235576 Epoche=4053\n",
      "Epsilon=0.801582 Action_times=2236713 Epoche=4054\n",
      "Epsilon=0.801484 Action_times=2237948 Epoche=4055\n",
      "Epsilon=0.801406 Action_times=2238940 Epoche=4056\n",
      "Epsilon=0.801310 Action_times=2240156 Epoche=4057\n",
      "Epsilon=0.801174 Action_times=2241872 Epoche=4058\n",
      "Epsilon=0.801116 Action_times=2242609 Epoche=4059\n",
      "Epsilon=0.800875 Action_times=2245656 Epoche=4060\n",
      "Epsilon=0.800792 Action_times=2246701 Epoche=4061\n",
      "Epsilon=0.800643 Action_times=2248588 Epoche=4062\n",
      "Epsilon=0.800526 Action_times=2250065 Epoche=4063\n",
      "Epsilon=0.800377 Action_times=2251954 Epoche=4064\n",
      "Epsilon=0.800332 Action_times=2252519 Epoche=4065\n",
      "Epsilon=0.800229 Action_times=2253820 Epoche=4066\n",
      "Epsilon=0.800068 Action_times=2255860 Epoche=4067\n",
      "Epsilon=0.800045 Action_times=2256153 Epoche=4068\n",
      "Epsilon=0.799991 Action_times=2256832 Epoche=4069\n",
      "Epsilon=0.799822 Action_times=2258971 Epoche=4070\n",
      "Epsilon=0.799816 Action_times=2259051 Epoche=4071\n",
      "Epsilon=0.799645 Action_times=2261214 Epoche=4072\n",
      "Epsilon=0.799523 Action_times=2262755 Epoche=4073\n",
      "Epsilon=0.799309 Action_times=2265469 Epoche=4074\n",
      "Epsilon=0.799247 Action_times=2266253 Epoche=4075\n",
      "Epsilon=0.799149 Action_times=2267503 Epoche=4076\n",
      "Epsilon=0.799024 Action_times=2269084 Epoche=4077\n",
      "Epsilon=0.798889 Action_times=2270797 Epoche=4078\n",
      "Epsilon=0.798804 Action_times=2271870 Epoche=4079\n",
      "Epsilon=0.798750 Action_times=2272549 Epoche=4080\n",
      "Epsilon=0.798692 Action_times=2273289 Epoche=4081\n",
      "Epsilon=0.798499 Action_times=2275732 Epoche=4082\n",
      "Epsilon=0.798387 Action_times=2277154 Epoche=4083\n",
      "Epsilon=0.798293 Action_times=2278348 Epoche=4084\n",
      "Epsilon=0.798236 Action_times=2279069 Epoche=4085\n",
      "Epsilon=0.798079 Action_times=2281071 Epoche=4086\n",
      "Epsilon=0.797913 Action_times=2283177 Epoche=4087\n",
      "Epsilon=0.797822 Action_times=2284329 Epoche=4088\n",
      "Epsilon=0.797605 Action_times=2287078 Epoche=4089\n",
      "Epsilon=0.797221 Action_times=2291953 Epoche=4090\n",
      "Epsilon=0.797137 Action_times=2293031 Epoche=4091\n",
      "Epsilon=0.796966 Action_times=2295205 Epoche=4092\n",
      "Epsilon=0.796924 Action_times=2295738 Epoche=4093\n",
      "Epsilon=0.796787 Action_times=2297469 Epoche=4094\n",
      "Epsilon=0.796726 Action_times=2298248 Epoche=4095\n",
      "Epsilon=0.796572 Action_times=2300210 Epoche=4096\n",
      "Epsilon=0.796415 Action_times=2302197 Epoche=4097\n",
      "Epsilon=0.796374 Action_times=2302724 Epoche=4098\n",
      "Epsilon=0.796312 Action_times=2303519 Epoche=4099\n",
      "Epsilon=0.796213 Action_times=2304774 Epoche=4100\n",
      "Epsilon=0.796072 Action_times=2306569 Epoche=4101\n",
      "Epsilon=0.796012 Action_times=2307324 Epoche=4102\n",
      "Epsilon=0.795931 Action_times=2308361 Epoche=4103\n",
      "Epsilon=0.795889 Action_times=2308890 Epoche=4104\n",
      "Epsilon=0.795804 Action_times=2309973 Epoche=4105\n",
      "Epsilon=0.795617 Action_times=2312355 Epoche=4106\n",
      "Epsilon=0.795479 Action_times=2314111 Epoche=4107\n",
      "Epsilon=0.795281 Action_times=2316637 Epoche=4108\n",
      "Epsilon=0.795137 Action_times=2318468 Epoche=4109\n",
      "Epsilon=0.795041 Action_times=2319687 Epoche=4110\n",
      "Epsilon=0.795023 Action_times=2319921 Epoche=4111\n",
      "Epsilon=0.794972 Action_times=2320571 Epoche=4112\n",
      "Epsilon=0.794872 Action_times=2321841 Epoche=4113\n",
      "Epsilon=0.794726 Action_times=2323701 Epoche=4114\n",
      "Epsilon=0.794698 Action_times=2324054 Epoche=4115\n",
      "Epsilon=0.794691 Action_times=2324146 Epoche=4116\n",
      "Epsilon=0.794556 Action_times=2325871 Epoche=4117\n",
      "Epsilon=0.794551 Action_times=2325938 Epoche=4118\n",
      "Epsilon=0.794433 Action_times=2327436 Epoche=4119\n",
      "Epsilon=0.794341 Action_times=2328617 Epoche=4120\n",
      "Epsilon=0.794267 Action_times=2329555 Epoche=4121\n",
      "Epsilon=0.794165 Action_times=2330857 Epoche=4122\n",
      "Epsilon=0.794031 Action_times=2332563 Epoche=4123\n",
      "Epsilon=0.793868 Action_times=2334639 Epoche=4124\n",
      "Epsilon=0.793795 Action_times=2335579 Epoche=4125\n",
      "Epsilon=0.793694 Action_times=2336861 Epoche=4126\n",
      "Epsilon=0.793659 Action_times=2337309 Epoche=4127\n",
      "Epsilon=0.793590 Action_times=2338187 Epoche=4128\n",
      "Epsilon=0.793541 Action_times=2338813 Epoche=4129\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.793532 Action_times=2338925 Epoche=4130\n",
      "Epsilon=0.793414 Action_times=2340432 Epoche=4131\n",
      "Epsilon=0.793403 Action_times=2340579 Epoche=4132\n",
      "Epsilon=0.793284 Action_times=2342098 Epoche=4133\n",
      "Epsilon=0.793246 Action_times=2342577 Epoche=4134\n",
      "Epsilon=0.793149 Action_times=2343816 Epoche=4135\n",
      "Epsilon=0.793017 Action_times=2345505 Epoche=4136\n",
      "Epsilon=0.792962 Action_times=2346202 Epoche=4137\n",
      "Epsilon=0.792841 Action_times=2347753 Epoche=4138\n",
      "Epsilon=0.792722 Action_times=2349275 Epoche=4139\n",
      "Epsilon=0.792653 Action_times=2350159 Epoche=4140\n",
      "Epsilon=0.792594 Action_times=2350907 Epoche=4141\n",
      "Epsilon=0.792450 Action_times=2352754 Epoche=4142\n",
      "Epsilon=0.792388 Action_times=2353538 Epoche=4143\n",
      "Epsilon=0.792362 Action_times=2353876 Epoche=4144\n",
      "Epsilon=0.792234 Action_times=2355504 Epoche=4145\n",
      "Epsilon=0.792108 Action_times=2357121 Epoche=4146\n",
      "Epsilon=0.791918 Action_times=2359557 Epoche=4147\n",
      "Epsilon=0.791892 Action_times=2359888 Epoche=4148\n",
      "Epsilon=0.791790 Action_times=2361191 Epoche=4149\n",
      "Epsilon=0.791637 Action_times=2363139 Epoche=4150\n",
      "Epsilon=0.791610 Action_times=2363491 Epoche=4151\n",
      "Epsilon=0.791572 Action_times=2363976 Epoche=4152\n",
      "Epsilon=0.791380 Action_times=2366432 Epoche=4153\n",
      "Epsilon=0.791302 Action_times=2367432 Epoche=4154\n",
      "Epsilon=0.791171 Action_times=2369110 Epoche=4155\n",
      "Epsilon=0.790994 Action_times=2371372 Epoche=4156\n",
      "Epsilon=0.790937 Action_times=2372105 Epoche=4157\n",
      "Epsilon=0.790883 Action_times=2372801 Epoche=4158\n",
      "Epsilon=0.790853 Action_times=2373181 Epoche=4159\n",
      "Epsilon=0.790800 Action_times=2373855 Epoche=4160\n",
      "Epsilon=0.790695 Action_times=2375210 Epoche=4161\n",
      "Epsilon=0.790511 Action_times=2377560 Epoche=4162\n",
      "Epsilon=0.790470 Action_times=2378084 Epoche=4163\n",
      "Epsilon=0.790409 Action_times=2378871 Epoche=4164\n",
      "Epsilon=0.790366 Action_times=2379421 Epoche=4165\n",
      "Epsilon=0.790342 Action_times=2379725 Epoche=4166\n",
      "Epsilon=0.790273 Action_times=2380610 Epoche=4167\n",
      "Epsilon=0.790182 Action_times=2381776 Epoche=4168\n",
      "Epsilon=0.790021 Action_times=2383840 Epoche=4169\n",
      "Epsilon=0.789875 Action_times=2385707 Epoche=4170\n",
      "Epsilon=0.789826 Action_times=2386337 Epoche=4171\n",
      "Epsilon=0.789755 Action_times=2387252 Epoche=4172\n",
      "Epsilon=0.789616 Action_times=2389030 Epoche=4173\n",
      "Epsilon=0.789294 Action_times=2393165 Epoche=4174\n",
      "Epsilon=0.789197 Action_times=2394412 Epoche=4175\n",
      "Epsilon=0.789125 Action_times=2395338 Epoche=4176\n",
      "Epsilon=0.789055 Action_times=2396232 Epoche=4177\n",
      "Epsilon=0.788959 Action_times=2397470 Epoche=4178\n",
      "Epsilon=0.788853 Action_times=2398830 Epoche=4179\n",
      "Epsilon=0.788518 Action_times=2403126 Epoche=4180\n",
      "Epsilon=0.788226 Action_times=2406880 Epoche=4181\n",
      "Epsilon=0.788211 Action_times=2407068 Epoche=4182\n",
      "Epsilon=0.788178 Action_times=2407494 Epoche=4183\n",
      "Epsilon=0.788130 Action_times=2408119 Epoche=4184\n",
      "Epsilon=0.787993 Action_times=2409869 Epoche=4185\n",
      "Epsilon=0.787966 Action_times=2410217 Epoche=4186\n",
      "Epsilon=0.787905 Action_times=2411002 Epoche=4187\n",
      "Epsilon=0.787874 Action_times=2411407 Epoche=4188\n",
      "Epsilon=0.787789 Action_times=2412499 Epoche=4189\n",
      "Epsilon=0.787685 Action_times=2413838 Epoche=4190\n",
      "Epsilon=0.787359 Action_times=2418027 Epoche=4191\n",
      "Epsilon=0.787275 Action_times=2419111 Epoche=4192\n",
      "Epsilon=0.787251 Action_times=2419419 Epoche=4193\n",
      "Epsilon=0.787077 Action_times=2421660 Epoche=4194\n",
      "Epsilon=0.786804 Action_times=2425172 Epoche=4195\n",
      "Epsilon=0.786742 Action_times=2425961 Epoche=4196\n",
      "Epsilon=0.786628 Action_times=2427430 Epoche=4197\n",
      "Epsilon=0.786573 Action_times=2428138 Epoche=4198\n",
      "Epsilon=0.786524 Action_times=2428780 Epoche=4199\n",
      "Epsilon=0.786438 Action_times=2429879 Epoche=4200\n",
      "Epsilon=0.786297 Action_times=2431703 Epoche=4201\n",
      "Epsilon=0.786240 Action_times=2432436 Epoche=4202\n",
      "Epsilon=0.786170 Action_times=2433333 Epoche=4203\n",
      "Epsilon=0.786113 Action_times=2434072 Epoche=4204\n",
      "Epsilon=0.786044 Action_times=2434962 Epoche=4205\n",
      "Epsilon=0.785979 Action_times=2435793 Epoche=4206\n",
      "Epsilon=0.785781 Action_times=2438350 Epoche=4207\n",
      "Epsilon=0.785659 Action_times=2439918 Epoche=4208\n",
      "Epsilon=0.785565 Action_times=2441136 Epoche=4209\n",
      "Epsilon=0.785314 Action_times=2444371 Epoche=4210\n",
      "Epsilon=0.785296 Action_times=2444595 Epoche=4211\n",
      "Epsilon=0.785095 Action_times=2447199 Epoche=4212\n",
      "Epsilon=0.784925 Action_times=2449387 Epoche=4213\n",
      "Epsilon=0.784834 Action_times=2450555 Epoche=4214\n",
      "Epsilon=0.784796 Action_times=2451058 Epoche=4215\n",
      "Epsilon=0.784739 Action_times=2451784 Epoche=4216\n",
      "Epsilon=0.784692 Action_times=2452399 Epoche=4217\n",
      "Epsilon=0.784509 Action_times=2454759 Epoche=4218\n",
      "Epsilon=0.784446 Action_times=2455570 Epoche=4219\n",
      "Epsilon=0.784347 Action_times=2456843 Epoche=4220\n",
      "Epsilon=0.784217 Action_times=2458522 Epoche=4221\n",
      "Epsilon=0.784034 Action_times=2460896 Epoche=4222\n",
      "Epsilon=0.783996 Action_times=2461383 Epoche=4223\n",
      "Epsilon=0.783951 Action_times=2461961 Epoche=4224\n",
      "Epsilon=0.783835 Action_times=2463458 Epoche=4225\n",
      "Epsilon=0.783772 Action_times=2464283 Epoche=4226\n",
      "Epsilon=0.783671 Action_times=2465577 Epoche=4227\n",
      "Epsilon=0.783563 Action_times=2466981 Epoche=4228\n",
      "Epsilon=0.783478 Action_times=2468082 Epoche=4229\n",
      "Epsilon=0.783358 Action_times=2469635 Epoche=4230\n",
      "Epsilon=0.783124 Action_times=2472650 Epoche=4231\n",
      "Epsilon=0.782991 Action_times=2474380 Epoche=4232\n",
      "Epsilon=0.782935 Action_times=2475094 Epoche=4233\n",
      "Epsilon=0.782895 Action_times=2475611 Epoche=4234\n",
      "Epsilon=0.782849 Action_times=2476213 Epoche=4235\n",
      "Epsilon=0.782822 Action_times=2476558 Epoche=4236\n",
      "Epsilon=0.782669 Action_times=2478547 Epoche=4237\n",
      "Epsilon=0.782535 Action_times=2480271 Epoche=4238\n",
      "Epsilon=0.782488 Action_times=2480885 Epoche=4239\n",
      "Epsilon=0.782372 Action_times=2482381 Epoche=4240\n",
      "Epsilon=0.782305 Action_times=2483254 Epoche=4241\n",
      "Epsilon=0.782190 Action_times=2484737 Epoche=4242\n",
      "Epsilon=0.782149 Action_times=2485276 Epoche=4243\n",
      "Epsilon=0.782095 Action_times=2485974 Epoche=4244\n",
      "Epsilon=0.782028 Action_times=2486837 Epoche=4245\n",
      "Epsilon=0.781929 Action_times=2488120 Epoche=4246\n",
      "Epsilon=0.781821 Action_times=2489526 Epoche=4247\n",
      "Epsilon=0.781776 Action_times=2490110 Epoche=4248\n",
      "Epsilon=0.781614 Action_times=2492207 Epoche=4249\n",
      "Epsilon=0.781541 Action_times=2493156 Epoche=4250\n",
      "Epsilon=0.781501 Action_times=2493673 Epoche=4251\n",
      "Epsilon=0.781362 Action_times=2495475 Epoche=4252\n",
      "Epsilon=0.781270 Action_times=2496670 Epoche=4253\n",
      "Epsilon=0.781167 Action_times=2497997 Epoche=4254\n",
      "Epsilon=0.781110 Action_times=2498734 Epoche=4255\n",
      "Epsilon=0.780888 Action_times=2501615 Epoche=4256\n",
      "Epsilon=0.780694 Action_times=2504134 Epoche=4257\n",
      "Epsilon=0.780613 Action_times=2505182 Epoche=4258\n",
      "Epsilon=0.780522 Action_times=2506367 Epoche=4259\n",
      "Epsilon=0.780486 Action_times=2506834 Epoche=4260\n",
      "Epsilon=0.780300 Action_times=2509251 Epoche=4261\n",
      "Epsilon=0.780159 Action_times=2511085 Epoche=4262\n",
      "Epsilon=0.779945 Action_times=2513862 Epoche=4263\n",
      "Epsilon=0.779812 Action_times=2515580 Epoche=4264\n",
      "Epsilon=0.779552 Action_times=2518960 Epoche=4265\n",
      "Epsilon=0.779471 Action_times=2520013 Epoche=4266\n",
      "Epsilon=0.779351 Action_times=2521577 Epoche=4267\n",
      "Epsilon=0.779247 Action_times=2522925 Epoche=4268\n",
      "Epsilon=0.779121 Action_times=2524561 Epoche=4269\n",
      "Epsilon=0.778786 Action_times=2528918 Epoche=4270\n",
      "Epsilon=0.778777 Action_times=2529039 Epoche=4271\n",
      "Epsilon=0.778620 Action_times=2531080 Epoche=4272\n",
      "Epsilon=0.778578 Action_times=2531626 Epoche=4273\n",
      "Epsilon=0.778565 Action_times=2531802 Epoche=4274\n",
      "Epsilon=0.778525 Action_times=2532312 Epoche=4275\n",
      "Epsilon=0.778373 Action_times=2534295 Epoche=4276\n",
      "Epsilon=0.778229 Action_times=2536166 Epoche=4277\n",
      "Epsilon=0.777950 Action_times=2539802 Epoche=4278\n",
      "Epsilon=0.777752 Action_times=2542381 Epoche=4279\n",
      "Epsilon=0.777596 Action_times=2544409 Epoche=4280\n",
      "Epsilon=0.777562 Action_times=2544855 Epoche=4281\n",
      "Epsilon=0.777555 Action_times=2544952 Epoche=4282\n",
      "Epsilon=0.777511 Action_times=2545525 Epoche=4283\n",
      "Epsilon=0.777308 Action_times=2548171 Epoche=4284\n",
      "Epsilon=0.777197 Action_times=2549609 Epoche=4285\n",
      "Epsilon=0.777080 Action_times=2551144 Epoche=4286\n",
      "Epsilon=0.776957 Action_times=2552736 Epoche=4287\n",
      "Epsilon=0.776923 Action_times=2553183 Epoche=4288\n",
      "Epsilon=0.776817 Action_times=2554565 Epoche=4289\n",
      "Epsilon=0.776690 Action_times=2556224 Epoche=4290\n",
      "Epsilon=0.776552 Action_times=2558028 Epoche=4291\n",
      "Epsilon=0.776523 Action_times=2558399 Epoche=4292\n",
      "Epsilon=0.776415 Action_times=2559817 Epoche=4293\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.776283 Action_times=2561529 Epoche=4294\n",
      "Epsilon=0.775988 Action_times=2565380 Epoche=4295\n",
      "Epsilon=0.775905 Action_times=2566473 Epoche=4296\n",
      "Epsilon=0.775847 Action_times=2567228 Epoche=4297\n",
      "Epsilon=0.775706 Action_times=2569064 Epoche=4298\n",
      "Epsilon=0.775580 Action_times=2570710 Epoche=4299\n",
      "Epsilon=0.775495 Action_times=2571824 Epoche=4300\n",
      "Epsilon=0.775397 Action_times=2573097 Epoche=4301\n",
      "Epsilon=0.775332 Action_times=2573957 Epoche=4302\n",
      "Epsilon=0.775277 Action_times=2574674 Epoche=4303\n",
      "Epsilon=0.775120 Action_times=2576725 Epoche=4304\n",
      "Epsilon=0.775041 Action_times=2577752 Epoche=4305\n",
      "Epsilon=0.774957 Action_times=2578854 Epoche=4306\n",
      "Epsilon=0.774816 Action_times=2580692 Epoche=4307\n",
      "Epsilon=0.774781 Action_times=2581158 Epoche=4308\n",
      "Epsilon=0.774742 Action_times=2581663 Epoche=4309\n",
      "Epsilon=0.774561 Action_times=2584029 Epoche=4310\n",
      "Epsilon=0.774495 Action_times=2584890 Epoche=4311\n",
      "Epsilon=0.774398 Action_times=2586167 Epoche=4312\n",
      "Epsilon=0.774243 Action_times=2588188 Epoche=4313\n",
      "Epsilon=0.774176 Action_times=2589072 Epoche=4314\n",
      "Epsilon=0.774030 Action_times=2590976 Epoche=4315\n",
      "Epsilon=0.773847 Action_times=2593375 Epoche=4316\n",
      "Epsilon=0.773500 Action_times=2597913 Epoche=4317\n",
      "Epsilon=0.773335 Action_times=2600075 Epoche=4318\n",
      "Epsilon=0.773154 Action_times=2602446 Epoche=4319\n",
      "Epsilon=0.773084 Action_times=2603363 Epoche=4320\n",
      "Epsilon=0.773030 Action_times=2604079 Epoche=4321\n",
      "Epsilon=0.772995 Action_times=2604533 Epoche=4322\n",
      "Epsilon=0.772927 Action_times=2605424 Epoche=4323\n",
      "Epsilon=0.772752 Action_times=2607724 Epoche=4324\n",
      "Epsilon=0.772715 Action_times=2608206 Epoche=4325\n",
      "Epsilon=0.772613 Action_times=2609543 Epoche=4326\n",
      "Epsilon=0.772441 Action_times=2611796 Epoche=4327\n",
      "Epsilon=0.772248 Action_times=2614329 Epoche=4328\n",
      "Epsilon=0.772162 Action_times=2615457 Epoche=4329\n",
      "Epsilon=0.772134 Action_times=2615822 Epoche=4330\n",
      "Epsilon=0.772091 Action_times=2616394 Epoche=4331\n",
      "Epsilon=0.772036 Action_times=2617114 Epoche=4332\n",
      "Epsilon=0.771893 Action_times=2618985 Epoche=4333\n",
      "Epsilon=0.771819 Action_times=2619954 Epoche=4334\n",
      "Epsilon=0.771735 Action_times=2621060 Epoche=4335\n",
      "Epsilon=0.771673 Action_times=2621872 Epoche=4336\n",
      "Epsilon=0.771505 Action_times=2624076 Epoche=4337\n",
      "Epsilon=0.771497 Action_times=2624184 Epoche=4338\n",
      "Epsilon=0.771397 Action_times=2625500 Epoche=4339\n",
      "Epsilon=0.771317 Action_times=2626551 Epoche=4340\n",
      "Epsilon=0.771129 Action_times=2629027 Epoche=4341\n",
      "Epsilon=0.770969 Action_times=2631129 Epoche=4342\n",
      "Epsilon=0.770782 Action_times=2633586 Epoche=4343\n",
      "Epsilon=0.770592 Action_times=2636077 Epoche=4344\n",
      "Epsilon=0.770575 Action_times=2636303 Epoche=4345\n",
      "Epsilon=0.770424 Action_times=2638294 Epoche=4346\n",
      "Epsilon=0.770279 Action_times=2640192 Epoche=4347\n",
      "Epsilon=0.770119 Action_times=2642301 Epoche=4348\n",
      "Epsilon=0.769993 Action_times=2643961 Epoche=4349\n",
      "Epsilon=0.769845 Action_times=2645907 Epoche=4350\n",
      "Epsilon=0.769750 Action_times=2647158 Epoche=4351\n",
      "Epsilon=0.769634 Action_times=2648680 Epoche=4352\n",
      "Epsilon=0.769581 Action_times=2649382 Epoche=4353\n",
      "Epsilon=0.769469 Action_times=2650860 Epoche=4354\n",
      "Epsilon=0.769355 Action_times=2652360 Epoche=4355\n",
      "Epsilon=0.769340 Action_times=2652548 Epoche=4356\n",
      "Epsilon=0.769279 Action_times=2653363 Epoche=4357\n",
      "Epsilon=0.769205 Action_times=2654337 Epoche=4358\n",
      "Epsilon=0.769079 Action_times=2655991 Epoche=4359\n",
      "Epsilon=0.768995 Action_times=2657094 Epoche=4360\n",
      "Epsilon=0.768947 Action_times=2657727 Epoche=4361\n",
      "Epsilon=0.768890 Action_times=2658483 Epoche=4362\n",
      "Epsilon=0.768839 Action_times=2659147 Epoche=4363\n",
      "Epsilon=0.768708 Action_times=2660878 Epoche=4364\n",
      "Epsilon=0.768646 Action_times=2661700 Epoche=4365\n",
      "Epsilon=0.768543 Action_times=2663050 Epoche=4366\n",
      "Epsilon=0.768452 Action_times=2664258 Epoche=4367\n",
      "Epsilon=0.768388 Action_times=2665103 Epoche=4368\n",
      "Epsilon=0.768288 Action_times=2666422 Epoche=4369\n",
      "Epsilon=0.768136 Action_times=2668428 Epoche=4370\n",
      "Epsilon=0.767963 Action_times=2670702 Epoche=4371\n",
      "Epsilon=0.767914 Action_times=2671356 Epoche=4372\n",
      "Epsilon=0.767696 Action_times=2674228 Epoche=4373\n",
      "Epsilon=0.767658 Action_times=2674733 Epoche=4374\n",
      "Epsilon=0.767648 Action_times=2674854 Epoche=4375\n",
      "Epsilon=0.767516 Action_times=2676608 Epoche=4376\n",
      "Epsilon=0.767370 Action_times=2678535 Epoche=4377\n",
      "Epsilon=0.767302 Action_times=2679431 Epoche=4378\n",
      "Epsilon=0.767265 Action_times=2679920 Epoche=4379\n",
      "Epsilon=0.767179 Action_times=2681053 Epoche=4380\n",
      "Epsilon=0.767141 Action_times=2681560 Epoche=4381\n",
      "Epsilon=0.767040 Action_times=2682887 Epoche=4382\n",
      "Epsilon=0.766983 Action_times=2683643 Epoche=4383\n",
      "Epsilon=0.766960 Action_times=2683939 Epoche=4384\n",
      "Epsilon=0.766889 Action_times=2684885 Epoche=4385\n",
      "Epsilon=0.766871 Action_times=2685123 Epoche=4386\n",
      "Epsilon=0.766811 Action_times=2685909 Epoche=4387\n",
      "Epsilon=0.766626 Action_times=2688358 Epoche=4388\n",
      "Epsilon=0.766577 Action_times=2689009 Epoche=4389\n",
      "Epsilon=0.766563 Action_times=2689193 Epoche=4390\n",
      "Epsilon=0.766477 Action_times=2690324 Epoche=4391\n",
      "Epsilon=0.766419 Action_times=2691100 Epoche=4392\n",
      "Epsilon=0.766403 Action_times=2691312 Epoche=4393\n",
      "Epsilon=0.766233 Action_times=2693558 Epoche=4394\n",
      "Epsilon=0.766113 Action_times=2695144 Epoche=4395\n",
      "Epsilon=0.765951 Action_times=2697285 Epoche=4396\n",
      "Epsilon=0.765660 Action_times=2701139 Epoche=4397\n",
      "Epsilon=0.765363 Action_times=2705070 Epoche=4398\n",
      "Epsilon=0.765301 Action_times=2705881 Epoche=4399\n",
      "Epsilon=0.765239 Action_times=2706706 Epoche=4400\n",
      "Epsilon=0.765112 Action_times=2708386 Epoche=4401\n",
      "Epsilon=0.765067 Action_times=2708989 Epoche=4402\n",
      "Epsilon=0.764987 Action_times=2710046 Epoche=4403\n",
      "Epsilon=0.764831 Action_times=2712108 Epoche=4404\n",
      "Epsilon=0.764763 Action_times=2713007 Epoche=4405\n",
      "Epsilon=0.764613 Action_times=2715003 Epoche=4406\n",
      "Epsilon=0.764607 Action_times=2715080 Epoche=4407\n",
      "Epsilon=0.764518 Action_times=2716263 Epoche=4408\n",
      "Epsilon=0.764347 Action_times=2718520 Epoche=4409\n",
      "Epsilon=0.764225 Action_times=2720137 Epoche=4410\n",
      "Epsilon=0.764174 Action_times=2720812 Epoche=4411\n",
      "Epsilon=0.764113 Action_times=2721626 Epoche=4412\n",
      "Epsilon=0.764003 Action_times=2723080 Epoche=4413\n",
      "Epsilon=0.763924 Action_times=2724128 Epoche=4414\n",
      "Epsilon=0.763878 Action_times=2724738 Epoche=4415\n",
      "Epsilon=0.763736 Action_times=2726627 Epoche=4416\n",
      "Epsilon=0.763640 Action_times=2727895 Epoche=4417\n",
      "Epsilon=0.763617 Action_times=2728200 Epoche=4418\n",
      "Epsilon=0.763551 Action_times=2729083 Epoche=4419\n",
      "Epsilon=0.763508 Action_times=2729652 Epoche=4420\n",
      "Epsilon=0.763420 Action_times=2730825 Epoche=4421\n",
      "Epsilon=0.763382 Action_times=2731319 Epoche=4422\n",
      "Epsilon=0.763242 Action_times=2733187 Epoche=4423\n",
      "Epsilon=0.763220 Action_times=2733473 Epoche=4424\n",
      "Epsilon=0.763139 Action_times=2734558 Epoche=4425\n",
      "Epsilon=0.762955 Action_times=2737001 Epoche=4426\n",
      "Epsilon=0.762913 Action_times=2737549 Epoche=4427\n",
      "Epsilon=0.762745 Action_times=2739785 Epoche=4428\n",
      "Epsilon=0.762674 Action_times=2740730 Epoche=4429\n",
      "Epsilon=0.762560 Action_times=2742241 Epoche=4430\n",
      "Epsilon=0.762481 Action_times=2743291 Epoche=4431\n",
      "Epsilon=0.762454 Action_times=2743657 Epoche=4432\n",
      "Epsilon=0.762342 Action_times=2745133 Epoche=4433\n",
      "Epsilon=0.762302 Action_times=2745669 Epoche=4434\n",
      "Epsilon=0.762157 Action_times=2747603 Epoche=4435\n",
      "Epsilon=0.761896 Action_times=2751072 Epoche=4436\n",
      "Epsilon=0.761705 Action_times=2753614 Epoche=4437\n",
      "Epsilon=0.761678 Action_times=2753973 Epoche=4438\n",
      "Epsilon=0.761626 Action_times=2754656 Epoche=4439\n",
      "Epsilon=0.761603 Action_times=2754963 Epoche=4440\n",
      "Epsilon=0.761495 Action_times=2756405 Epoche=4441\n",
      "Epsilon=0.761448 Action_times=2757032 Epoche=4442\n",
      "Epsilon=0.761368 Action_times=2758088 Epoche=4443\n",
      "Epsilon=0.761213 Action_times=2760155 Epoche=4444\n",
      "Epsilon=0.761131 Action_times=2761246 Epoche=4445\n",
      "Epsilon=0.761058 Action_times=2762217 Epoche=4446\n",
      "Epsilon=0.760969 Action_times=2763410 Epoche=4447\n",
      "Epsilon=0.760860 Action_times=2764862 Epoche=4448\n",
      "Epsilon=0.760836 Action_times=2765171 Epoche=4449\n",
      "Epsilon=0.760689 Action_times=2767131 Epoche=4450\n",
      "Epsilon=0.760505 Action_times=2769583 Epoche=4451\n",
      "Epsilon=0.760329 Action_times=2771938 Epoche=4452\n",
      "Epsilon=0.760285 Action_times=2772514 Epoche=4453\n",
      "Epsilon=0.760237 Action_times=2773162 Epoche=4454\n",
      "Epsilon=0.760039 Action_times=2775802 Epoche=4455\n",
      "Epsilon=0.760024 Action_times=2776002 Epoche=4456\n",
      "Epsilon=0.759862 Action_times=2778156 Epoche=4457\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.759807 Action_times=2778885 Epoche=4458\n",
      "Epsilon=0.759780 Action_times=2779255 Epoche=4459\n",
      "Epsilon=0.759735 Action_times=2779857 Epoche=4460\n",
      "Epsilon=0.759652 Action_times=2780963 Epoche=4461\n",
      "Epsilon=0.759621 Action_times=2781377 Epoche=4462\n",
      "Epsilon=0.759600 Action_times=2781652 Epoche=4463\n",
      "Epsilon=0.759352 Action_times=2784957 Epoche=4464\n",
      "Epsilon=0.759274 Action_times=2786000 Epoche=4465\n",
      "Epsilon=0.759074 Action_times=2788667 Epoche=4466\n",
      "Epsilon=0.759030 Action_times=2789263 Epoche=4467\n",
      "Epsilon=0.758857 Action_times=2791573 Epoche=4468\n",
      "Epsilon=0.758855 Action_times=2791595 Epoche=4469\n",
      "Epsilon=0.758589 Action_times=2795144 Epoche=4470\n",
      "Epsilon=0.758535 Action_times=2795866 Epoche=4471\n",
      "Epsilon=0.758437 Action_times=2797173 Epoche=4472\n",
      "Epsilon=0.758279 Action_times=2799288 Epoche=4473\n",
      "Epsilon=0.758188 Action_times=2800509 Epoche=4474\n",
      "Epsilon=0.758107 Action_times=2801590 Epoche=4475\n",
      "Epsilon=0.757948 Action_times=2803716 Epoche=4476\n",
      "Epsilon=0.757835 Action_times=2805229 Epoche=4477\n",
      "Epsilon=0.757790 Action_times=2805829 Epoche=4478\n",
      "Epsilon=0.757688 Action_times=2807191 Epoche=4479\n",
      "Epsilon=0.757606 Action_times=2808293 Epoche=4480\n",
      "Epsilon=0.757520 Action_times=2809442 Epoche=4481\n",
      "Epsilon=0.757490 Action_times=2809843 Epoche=4482\n",
      "Epsilon=0.757337 Action_times=2811881 Epoche=4483\n",
      "Epsilon=0.757300 Action_times=2812388 Epoche=4484\n",
      "Epsilon=0.757221 Action_times=2813434 Epoche=4485\n",
      "Epsilon=0.757149 Action_times=2814399 Epoche=4486\n",
      "Epsilon=0.757057 Action_times=2815640 Epoche=4487\n",
      "Epsilon=0.756855 Action_times=2818337 Epoche=4488\n",
      "Epsilon=0.756724 Action_times=2820097 Epoche=4489\n",
      "Epsilon=0.756575 Action_times=2822086 Epoche=4490\n",
      "Epsilon=0.756414 Action_times=2824248 Epoche=4491\n",
      "Epsilon=0.756384 Action_times=2824644 Epoche=4492\n",
      "Epsilon=0.756232 Action_times=2826689 Epoche=4493\n",
      "Epsilon=0.756138 Action_times=2827939 Epoche=4494\n",
      "Epsilon=0.756001 Action_times=2829784 Epoche=4495\n",
      "Epsilon=0.755853 Action_times=2831764 Epoche=4496\n",
      "Epsilon=0.755807 Action_times=2832381 Epoche=4497\n",
      "Epsilon=0.755796 Action_times=2832527 Epoche=4498\n",
      "Epsilon=0.755677 Action_times=2834120 Epoche=4499\n",
      "Epsilon=0.755663 Action_times=2834308 Epoche=4500\n",
      "Epsilon=0.755513 Action_times=2836323 Epoche=4501\n",
      "Epsilon=0.755415 Action_times=2837644 Epoche=4502\n",
      "Epsilon=0.755249 Action_times=2839866 Epoche=4503\n",
      "Epsilon=0.755157 Action_times=2841101 Epoche=4504\n",
      "Epsilon=0.755141 Action_times=2841320 Epoche=4505\n",
      "Epsilon=0.754981 Action_times=2843465 Epoche=4506\n",
      "Epsilon=0.754761 Action_times=2846412 Epoche=4507\n",
      "Epsilon=0.754568 Action_times=2849003 Epoche=4508\n",
      "Epsilon=0.754472 Action_times=2850300 Epoche=4509\n",
      "Epsilon=0.754425 Action_times=2850926 Epoche=4510\n",
      "Epsilon=0.754369 Action_times=2851675 Epoche=4511\n",
      "Epsilon=0.754212 Action_times=2853796 Epoche=4512\n",
      "Epsilon=0.753987 Action_times=2856809 Epoche=4513\n",
      "Epsilon=0.753852 Action_times=2858625 Epoche=4514\n",
      "Epsilon=0.753795 Action_times=2859396 Epoche=4515\n",
      "Epsilon=0.753703 Action_times=2860629 Epoche=4516\n",
      "Epsilon=0.753646 Action_times=2861402 Epoche=4517\n",
      "Epsilon=0.753563 Action_times=2862509 Epoche=4518\n",
      "Epsilon=0.753553 Action_times=2862655 Epoche=4519\n",
      "Epsilon=0.753494 Action_times=2863449 Epoche=4520\n",
      "Epsilon=0.753444 Action_times=2864112 Epoche=4521\n",
      "Epsilon=0.753295 Action_times=2866120 Epoche=4522\n",
      "Epsilon=0.753251 Action_times=2866707 Epoche=4523\n",
      "Epsilon=0.753225 Action_times=2867062 Epoche=4524\n",
      "Epsilon=0.753128 Action_times=2868361 Epoche=4525\n",
      "Epsilon=0.753044 Action_times=2869502 Epoche=4526\n",
      "Epsilon=0.753009 Action_times=2869964 Epoche=4527\n",
      "Epsilon=0.752991 Action_times=2870215 Epoche=4528\n",
      "Epsilon=0.752948 Action_times=2870789 Epoche=4529\n",
      "Epsilon=0.752808 Action_times=2872679 Epoche=4530\n",
      "Epsilon=0.752749 Action_times=2873474 Epoche=4531\n",
      "Epsilon=0.752639 Action_times=2874944 Epoche=4532\n",
      "Epsilon=0.752609 Action_times=2875359 Epoche=4533\n",
      "Epsilon=0.752569 Action_times=2875893 Epoche=4534\n",
      "Epsilon=0.752539 Action_times=2876292 Epoche=4535\n",
      "Epsilon=0.752469 Action_times=2877238 Epoche=4536\n",
      "Epsilon=0.752399 Action_times=2878187 Epoche=4537\n",
      "Epsilon=0.752329 Action_times=2879126 Epoche=4538\n",
      "Epsilon=0.752298 Action_times=2879537 Epoche=4539\n",
      "Epsilon=0.752237 Action_times=2880359 Epoche=4540\n",
      "Epsilon=0.752191 Action_times=2880980 Epoche=4541\n",
      "Epsilon=0.752161 Action_times=2881393 Epoche=4542\n",
      "Epsilon=0.752074 Action_times=2882555 Epoche=4543\n",
      "Epsilon=0.752038 Action_times=2883046 Epoche=4544\n",
      "Epsilon=0.751953 Action_times=2884197 Epoche=4545\n",
      "Epsilon=0.751776 Action_times=2886571 Epoche=4546\n",
      "Epsilon=0.751632 Action_times=2888524 Epoche=4547\n",
      "Epsilon=0.751619 Action_times=2888689 Epoche=4548\n",
      "Epsilon=0.751499 Action_times=2890318 Epoche=4549\n",
      "Epsilon=0.751404 Action_times=2891591 Epoche=4550\n",
      "Epsilon=0.751361 Action_times=2892172 Epoche=4551\n",
      "Epsilon=0.751259 Action_times=2893542 Epoche=4552\n",
      "Epsilon=0.751125 Action_times=2895358 Epoche=4553\n",
      "Epsilon=0.750990 Action_times=2897182 Epoche=4554\n",
      "Epsilon=0.750876 Action_times=2898715 Epoche=4555\n",
      "Epsilon=0.750763 Action_times=2900236 Epoche=4556\n",
      "Epsilon=0.750656 Action_times=2901684 Epoche=4557\n",
      "Epsilon=0.750594 Action_times=2902530 Epoche=4558\n",
      "Epsilon=0.750398 Action_times=2905177 Epoche=4559\n",
      "Epsilon=0.750257 Action_times=2907081 Epoche=4560\n",
      "Epsilon=0.750233 Action_times=2907394 Epoche=4561\n",
      "Epsilon=0.750169 Action_times=2908265 Epoche=4562\n",
      "Epsilon=0.750108 Action_times=2909084 Epoche=4563\n",
      "Epsilon=0.750011 Action_times=2910402 Epoche=4564\n",
      "Epsilon=0.749992 Action_times=2910657 Epoche=4565\n",
      "Epsilon=0.749883 Action_times=2912135 Epoche=4566\n",
      "Epsilon=0.749741 Action_times=2914042 Epoche=4567\n",
      "Epsilon=0.749616 Action_times=2915737 Epoche=4568\n",
      "Epsilon=0.749585 Action_times=2916155 Epoche=4569\n",
      "Epsilon=0.749554 Action_times=2916573 Epoche=4570\n",
      "Epsilon=0.749478 Action_times=2917602 Epoche=4571\n",
      "Epsilon=0.749405 Action_times=2918598 Epoche=4572\n",
      "Epsilon=0.749367 Action_times=2919106 Epoche=4573\n",
      "Epsilon=0.749315 Action_times=2919814 Epoche=4574\n",
      "Epsilon=0.749205 Action_times=2921291 Epoche=4575\n",
      "Epsilon=0.749082 Action_times=2922954 Epoche=4576\n",
      "Epsilon=0.749026 Action_times=2923724 Epoche=4577\n",
      "Epsilon=0.748949 Action_times=2924765 Epoche=4578\n",
      "Epsilon=0.748871 Action_times=2925816 Epoche=4579\n",
      "Epsilon=0.748846 Action_times=2926148 Epoche=4580\n",
      "Epsilon=0.748773 Action_times=2927142 Epoche=4581\n",
      "Epsilon=0.748711 Action_times=2927975 Epoche=4582\n",
      "Epsilon=0.748678 Action_times=2928432 Epoche=4583\n",
      "Epsilon=0.748617 Action_times=2929253 Epoche=4584\n",
      "Epsilon=0.748602 Action_times=2929457 Epoche=4585\n",
      "Epsilon=0.748541 Action_times=2930286 Epoche=4586\n",
      "Epsilon=0.748458 Action_times=2931408 Epoche=4587\n",
      "Epsilon=0.748291 Action_times=2933665 Epoche=4588\n",
      "Epsilon=0.748188 Action_times=2935066 Epoche=4589\n",
      "Epsilon=0.748043 Action_times=2937030 Epoche=4590\n",
      "Epsilon=0.747941 Action_times=2938410 Epoche=4591\n",
      "Epsilon=0.747873 Action_times=2939329 Epoche=4592\n",
      "Epsilon=0.747748 Action_times=2941021 Epoche=4593\n",
      "Epsilon=0.747713 Action_times=2941499 Epoche=4594\n",
      "Epsilon=0.747648 Action_times=2942377 Epoche=4595\n",
      "Epsilon=0.747556 Action_times=2943629 Epoche=4596\n",
      "Epsilon=0.747501 Action_times=2944372 Epoche=4597\n",
      "Epsilon=0.747377 Action_times=2946052 Epoche=4598\n",
      "Epsilon=0.747205 Action_times=2948386 Epoche=4599\n",
      "Epsilon=0.747043 Action_times=2950584 Epoche=4600\n",
      "Epsilon=0.746989 Action_times=2951326 Epoche=4601\n",
      "Epsilon=0.746856 Action_times=2953122 Epoche=4602\n",
      "Epsilon=0.746769 Action_times=2954299 Epoche=4603\n",
      "Epsilon=0.746639 Action_times=2956069 Epoche=4604\n",
      "Epsilon=0.746551 Action_times=2957265 Epoche=4605\n",
      "Epsilon=0.746502 Action_times=2957935 Epoche=4606\n",
      "Epsilon=0.746441 Action_times=2958758 Epoche=4607\n",
      "Epsilon=0.746425 Action_times=2958976 Epoche=4608\n",
      "Epsilon=0.746396 Action_times=2959365 Epoche=4609\n",
      "Epsilon=0.746325 Action_times=2960336 Epoche=4610\n",
      "Epsilon=0.746303 Action_times=2960629 Epoche=4611\n",
      "Epsilon=0.746265 Action_times=2961152 Epoche=4612\n",
      "Epsilon=0.746237 Action_times=2961524 Epoche=4613\n",
      "Epsilon=0.746124 Action_times=2963062 Epoche=4614\n",
      "Epsilon=0.746073 Action_times=2963761 Epoche=4615\n",
      "Epsilon=0.746014 Action_times=2964558 Epoche=4616\n",
      "Epsilon=0.745998 Action_times=2964771 Epoche=4617\n",
      "Epsilon=0.745936 Action_times=2965622 Epoche=4618\n",
      "Epsilon=0.745823 Action_times=2967147 Epoche=4619\n",
      "Epsilon=0.745755 Action_times=2968073 Epoche=4620\n",
      "Epsilon=0.745689 Action_times=2968976 Epoche=4621\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.745604 Action_times=2970136 Epoche=4622\n",
      "Epsilon=0.745516 Action_times=2971321 Epoche=4623\n",
      "Epsilon=0.745431 Action_times=2972480 Epoche=4624\n",
      "Epsilon=0.745405 Action_times=2972829 Epoche=4625\n",
      "Epsilon=0.745346 Action_times=2973632 Epoche=4626\n",
      "Epsilon=0.745226 Action_times=2975276 Epoche=4627\n",
      "Epsilon=0.745132 Action_times=2976553 Epoche=4628\n",
      "Epsilon=0.745095 Action_times=2977050 Epoche=4629\n",
      "Epsilon=0.744940 Action_times=2979165 Epoche=4630\n",
      "Epsilon=0.744885 Action_times=2979913 Epoche=4631\n",
      "Epsilon=0.744859 Action_times=2980265 Epoche=4632\n",
      "Epsilon=0.744663 Action_times=2982936 Epoche=4633\n",
      "Epsilon=0.744526 Action_times=2984799 Epoche=4634\n",
      "Epsilon=0.744480 Action_times=2985420 Epoche=4635\n",
      "Epsilon=0.744320 Action_times=2987603 Epoche=4636\n",
      "Epsilon=0.744213 Action_times=2989064 Epoche=4637\n",
      "Epsilon=0.744176 Action_times=2989555 Epoche=4638\n",
      "Epsilon=0.744134 Action_times=2990132 Epoche=4639\n",
      "Epsilon=0.744031 Action_times=2991542 Epoche=4640\n",
      "Epsilon=0.743923 Action_times=2993014 Epoche=4641\n",
      "Epsilon=0.743882 Action_times=2993562 Epoche=4642\n",
      "Epsilon=0.743876 Action_times=2993652 Epoche=4643\n",
      "Epsilon=0.743745 Action_times=2995431 Epoche=4644\n",
      "Epsilon=0.743689 Action_times=2996202 Epoche=4645\n",
      "Epsilon=0.743609 Action_times=2997287 Epoche=4646\n",
      "Epsilon=0.743528 Action_times=2998389 Epoche=4647\n",
      "Epsilon=0.743452 Action_times=2999432 Epoche=4648\n",
      "Epsilon=0.743398 Action_times=3000159 Epoche=4649\n",
      "Epsilon=0.743233 Action_times=3002414 Epoche=4650\n",
      "Epsilon=0.743207 Action_times=3002765 Epoche=4651\n",
      "Epsilon=0.743095 Action_times=3004291 Epoche=4652\n",
      "Epsilon=0.742964 Action_times=3006082 Epoche=4653\n",
      "Epsilon=0.742898 Action_times=3006989 Epoche=4654\n",
      "Epsilon=0.742743 Action_times=3009101 Epoche=4655\n",
      "Epsilon=0.742591 Action_times=3011167 Epoche=4656\n",
      "Epsilon=0.742514 Action_times=3012224 Epoche=4657\n",
      "Epsilon=0.742489 Action_times=3012568 Epoche=4658\n",
      "Epsilon=0.742364 Action_times=3014277 Epoche=4659\n",
      "Epsilon=0.742202 Action_times=3016486 Epoche=4660\n",
      "Epsilon=0.742064 Action_times=3018374 Epoche=4661\n",
      "Epsilon=0.741886 Action_times=3020800 Epoche=4662\n",
      "Epsilon=0.741848 Action_times=3021323 Epoche=4663\n",
      "Epsilon=0.741679 Action_times=3023637 Epoche=4664\n",
      "Epsilon=0.741633 Action_times=3024253 Epoche=4665\n",
      "Epsilon=0.741575 Action_times=3025051 Epoche=4666\n",
      "Epsilon=0.741460 Action_times=3026622 Epoche=4667\n",
      "Epsilon=0.741363 Action_times=3027956 Epoche=4668\n",
      "Epsilon=0.741299 Action_times=3028826 Epoche=4669\n",
      "Epsilon=0.741148 Action_times=3030894 Epoche=4670\n",
      "Epsilon=0.741125 Action_times=3031201 Epoche=4671\n",
      "Epsilon=0.741097 Action_times=3031593 Epoche=4672\n",
      "Epsilon=0.740945 Action_times=3033666 Epoche=4673\n",
      "Epsilon=0.740828 Action_times=3035272 Epoche=4674\n",
      "Epsilon=0.740814 Action_times=3035458 Epoche=4675\n",
      "Epsilon=0.740741 Action_times=3036453 Epoche=4676\n",
      "Epsilon=0.740644 Action_times=3037790 Epoche=4677\n",
      "Epsilon=0.740627 Action_times=3038025 Epoche=4678\n",
      "Epsilon=0.740590 Action_times=3038528 Epoche=4679\n",
      "Epsilon=0.740543 Action_times=3039171 Epoche=4680\n",
      "Epsilon=0.740476 Action_times=3040079 Epoche=4681\n",
      "Epsilon=0.740434 Action_times=3040654 Epoche=4682\n",
      "Epsilon=0.740395 Action_times=3041201 Epoche=4683\n",
      "Epsilon=0.740333 Action_times=3042049 Epoche=4684\n",
      "Epsilon=0.740202 Action_times=3043834 Epoche=4685\n",
      "Epsilon=0.740040 Action_times=3046061 Epoche=4686\n",
      "Epsilon=0.739938 Action_times=3047453 Epoche=4687\n",
      "Epsilon=0.739856 Action_times=3048571 Epoche=4688\n",
      "Epsilon=0.739819 Action_times=3049077 Epoche=4689\n",
      "Epsilon=0.739773 Action_times=3049710 Epoche=4690\n",
      "Epsilon=0.739760 Action_times=3049893 Epoche=4691\n",
      "Epsilon=0.739681 Action_times=3050970 Epoche=4692\n",
      "Epsilon=0.739597 Action_times=3052126 Epoche=4693\n",
      "Epsilon=0.739480 Action_times=3053732 Epoche=4694\n",
      "Epsilon=0.739417 Action_times=3054598 Epoche=4695\n",
      "Epsilon=0.739042 Action_times=3059732 Epoche=4696\n",
      "Epsilon=0.738877 Action_times=3061999 Epoche=4697\n",
      "Epsilon=0.738811 Action_times=3062907 Epoche=4698\n",
      "Epsilon=0.738705 Action_times=3064358 Epoche=4699\n",
      "Epsilon=0.738538 Action_times=3066658 Epoche=4700\n",
      "Epsilon=0.738484 Action_times=3067394 Epoche=4701\n",
      "Epsilon=0.738351 Action_times=3069216 Epoche=4702\n",
      "Epsilon=0.738231 Action_times=3070864 Epoche=4703\n",
      "Epsilon=0.738139 Action_times=3072123 Epoche=4704\n",
      "Epsilon=0.738055 Action_times=3073279 Epoche=4705\n",
      "Epsilon=0.737972 Action_times=3074424 Epoche=4706\n",
      "Epsilon=0.737888 Action_times=3075576 Epoche=4707\n",
      "Epsilon=0.737840 Action_times=3076234 Epoche=4708\n",
      "Epsilon=0.737819 Action_times=3076526 Epoche=4709\n",
      "Epsilon=0.737760 Action_times=3077342 Epoche=4710\n",
      "Epsilon=0.737714 Action_times=3077969 Epoche=4711\n",
      "Epsilon=0.737623 Action_times=3079216 Epoche=4712\n",
      "Epsilon=0.737590 Action_times=3079675 Epoche=4713\n",
      "Epsilon=0.737571 Action_times=3079934 Epoche=4714\n",
      "Epsilon=0.737526 Action_times=3080553 Epoche=4715\n",
      "Epsilon=0.737433 Action_times=3081833 Epoche=4716\n",
      "Epsilon=0.737425 Action_times=3081937 Epoche=4717\n",
      "Epsilon=0.737313 Action_times=3083486 Epoche=4718\n",
      "Epsilon=0.737311 Action_times=3083502 Epoche=4719\n",
      "Epsilon=0.737297 Action_times=3083697 Epoche=4720\n",
      "Epsilon=0.737168 Action_times=3085475 Epoche=4721\n",
      "Epsilon=0.737019 Action_times=3087528 Epoche=4722\n",
      "Epsilon=0.736984 Action_times=3088009 Epoche=4723\n",
      "Epsilon=0.736801 Action_times=3090525 Epoche=4724\n",
      "Epsilon=0.736646 Action_times=3092654 Epoche=4725\n",
      "Epsilon=0.736526 Action_times=3094310 Epoche=4726\n",
      "Epsilon=0.736446 Action_times=3095406 Epoche=4727\n",
      "Epsilon=0.736333 Action_times=3096964 Epoche=4728\n",
      "Epsilon=0.736224 Action_times=3098469 Epoche=4729\n",
      "Epsilon=0.736062 Action_times=3100702 Epoche=4730\n",
      "Epsilon=0.735992 Action_times=3101662 Epoche=4731\n",
      "Epsilon=0.735943 Action_times=3102341 Epoche=4732\n",
      "Epsilon=0.735873 Action_times=3103295 Epoche=4733\n",
      "Epsilon=0.735776 Action_times=3104630 Epoche=4734\n",
      "Epsilon=0.735725 Action_times=3105331 Epoche=4735\n",
      "Epsilon=0.735616 Action_times=3106837 Epoche=4736\n",
      "Epsilon=0.735533 Action_times=3107985 Epoche=4737\n",
      "Epsilon=0.735392 Action_times=3109925 Epoche=4738\n",
      "Epsilon=0.735371 Action_times=3110217 Epoche=4739\n",
      "Epsilon=0.735313 Action_times=3111016 Epoche=4740\n",
      "Epsilon=0.735200 Action_times=3112579 Epoche=4741\n",
      "Epsilon=0.735136 Action_times=3113455 Epoche=4742\n",
      "Epsilon=0.735112 Action_times=3113788 Epoche=4743\n",
      "Epsilon=0.735039 Action_times=3114790 Epoche=4744\n",
      "Epsilon=0.735016 Action_times=3115108 Epoche=4745\n",
      "Epsilon=0.734937 Action_times=3116208 Epoche=4746\n",
      "Epsilon=0.734914 Action_times=3116515 Epoche=4747\n",
      "Epsilon=0.734847 Action_times=3117449 Epoche=4748\n",
      "Epsilon=0.734813 Action_times=3117918 Epoche=4749\n",
      "Epsilon=0.734719 Action_times=3119209 Epoche=4750\n",
      "Epsilon=0.734589 Action_times=3121006 Epoche=4751\n",
      "Epsilon=0.734577 Action_times=3121171 Epoche=4752\n",
      "Epsilon=0.734531 Action_times=3121804 Epoche=4753\n",
      "Epsilon=0.734450 Action_times=3122924 Epoche=4754\n",
      "Epsilon=0.734399 Action_times=3123625 Epoche=4755\n",
      "Epsilon=0.734379 Action_times=3123905 Epoche=4756\n",
      "Epsilon=0.734345 Action_times=3124377 Epoche=4757\n",
      "Epsilon=0.734217 Action_times=3126142 Epoche=4758\n",
      "Epsilon=0.734148 Action_times=3127092 Epoche=4759\n",
      "Epsilon=0.734031 Action_times=3128702 Epoche=4760\n",
      "Epsilon=0.734009 Action_times=3129006 Epoche=4761\n",
      "Epsilon=0.733903 Action_times=3130481 Epoche=4762\n",
      "Epsilon=0.733893 Action_times=3130612 Epoche=4763\n",
      "Epsilon=0.733826 Action_times=3131541 Epoche=4764\n",
      "Epsilon=0.733721 Action_times=3132990 Epoche=4765\n",
      "Epsilon=0.733606 Action_times=3134582 Epoche=4766\n",
      "Epsilon=0.733565 Action_times=3135139 Epoche=4767\n",
      "Epsilon=0.733466 Action_times=3136513 Epoche=4768\n",
      "Epsilon=0.733379 Action_times=3137712 Epoche=4769\n",
      "Epsilon=0.733368 Action_times=3137874 Epoche=4770\n",
      "Epsilon=0.733298 Action_times=3138839 Epoche=4771\n",
      "Epsilon=0.733072 Action_times=3141961 Epoche=4772\n",
      "Epsilon=0.732934 Action_times=3143876 Epoche=4773\n",
      "Epsilon=0.732894 Action_times=3144429 Epoche=4774\n",
      "Epsilon=0.732808 Action_times=3145620 Epoche=4775\n",
      "Epsilon=0.732702 Action_times=3147084 Epoche=4776\n",
      "Epsilon=0.732656 Action_times=3147723 Epoche=4777\n",
      "Epsilon=0.732604 Action_times=3148440 Epoche=4778\n",
      "Epsilon=0.732560 Action_times=3149042 Epoche=4779\n",
      "Epsilon=0.732524 Action_times=3149539 Epoche=4780\n",
      "Epsilon=0.732485 Action_times=3150088 Epoche=4781\n",
      "Epsilon=0.732354 Action_times=3151890 Epoche=4782\n",
      "Epsilon=0.732336 Action_times=3152141 Epoche=4783\n",
      "Epsilon=0.732307 Action_times=3152551 Epoche=4784\n",
      "Epsilon=0.732179 Action_times=3154322 Epoche=4785\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.732100 Action_times=3155416 Epoche=4786\n",
      "Epsilon=0.732009 Action_times=3156674 Epoche=4787\n",
      "Epsilon=0.731983 Action_times=3157040 Epoche=4788\n",
      "Epsilon=0.731893 Action_times=3158280 Epoche=4789\n",
      "Epsilon=0.731793 Action_times=3159668 Epoche=4790\n",
      "Epsilon=0.731694 Action_times=3161044 Epoche=4791\n",
      "Epsilon=0.731644 Action_times=3161736 Epoche=4792\n",
      "Epsilon=0.731523 Action_times=3163409 Epoche=4793\n",
      "Epsilon=0.731507 Action_times=3163630 Epoche=4794\n",
      "Epsilon=0.731470 Action_times=3164147 Epoche=4795\n",
      "Epsilon=0.731387 Action_times=3165287 Epoche=4796\n",
      "Epsilon=0.731254 Action_times=3167139 Epoche=4797\n",
      "Epsilon=0.731210 Action_times=3167743 Epoche=4798\n",
      "Epsilon=0.731154 Action_times=3168516 Epoche=4799\n",
      "Epsilon=0.731035 Action_times=3170178 Epoche=4800\n",
      "Epsilon=0.730866 Action_times=3172513 Epoche=4801\n",
      "Epsilon=0.730854 Action_times=3172684 Epoche=4802\n",
      "Epsilon=0.730713 Action_times=3174638 Epoche=4803\n",
      "Epsilon=0.730545 Action_times=3176965 Epoche=4804\n",
      "Epsilon=0.730423 Action_times=3178658 Epoche=4805\n",
      "Epsilon=0.730340 Action_times=3179822 Epoche=4806\n",
      "Epsilon=0.730316 Action_times=3180154 Epoche=4807\n",
      "Epsilon=0.730266 Action_times=3180842 Epoche=4808\n",
      "Epsilon=0.730136 Action_times=3182653 Epoche=4809\n",
      "Epsilon=0.730095 Action_times=3183224 Epoche=4810\n",
      "Epsilon=0.729979 Action_times=3184823 Epoche=4811\n",
      "Epsilon=0.729911 Action_times=3185768 Epoche=4812\n",
      "Epsilon=0.729890 Action_times=3186064 Epoche=4813\n",
      "Epsilon=0.729815 Action_times=3187104 Epoche=4814\n",
      "Epsilon=0.729761 Action_times=3187864 Epoche=4815\n",
      "Epsilon=0.729752 Action_times=3187982 Epoche=4816\n",
      "Epsilon=0.729691 Action_times=3188833 Epoche=4817\n",
      "Epsilon=0.729623 Action_times=3189776 Epoche=4818\n",
      "Epsilon=0.729550 Action_times=3190791 Epoche=4819\n",
      "Epsilon=0.729495 Action_times=3191555 Epoche=4820\n",
      "Epsilon=0.729392 Action_times=3192982 Epoche=4821\n",
      "Epsilon=0.729281 Action_times=3194528 Epoche=4822\n",
      "Epsilon=0.729158 Action_times=3196235 Epoche=4823\n",
      "Epsilon=0.729064 Action_times=3197542 Epoche=4824\n",
      "Epsilon=0.728994 Action_times=3198523 Epoche=4825\n",
      "Epsilon=0.728826 Action_times=3200850 Epoche=4826\n",
      "Epsilon=0.728712 Action_times=3202448 Epoche=4827\n",
      "Epsilon=0.728684 Action_times=3202826 Epoche=4828\n",
      "Epsilon=0.728654 Action_times=3203245 Epoche=4829\n",
      "Epsilon=0.728591 Action_times=3204128 Epoche=4830\n",
      "Epsilon=0.728562 Action_times=3204533 Epoche=4831\n",
      "Epsilon=0.728522 Action_times=3205082 Epoche=4832\n",
      "Epsilon=0.728480 Action_times=3205677 Epoche=4833\n",
      "Epsilon=0.728340 Action_times=3207618 Epoche=4834\n",
      "Epsilon=0.728317 Action_times=3207936 Epoche=4835\n",
      "Epsilon=0.728195 Action_times=3209642 Epoche=4836\n",
      "Epsilon=0.728114 Action_times=3210772 Epoche=4837\n",
      "Epsilon=0.728047 Action_times=3211703 Epoche=4838\n",
      "Epsilon=0.727864 Action_times=3214245 Epoche=4839\n",
      "Epsilon=0.727798 Action_times=3215167 Epoche=4840\n",
      "Epsilon=0.727746 Action_times=3215886 Epoche=4841\n",
      "Epsilon=0.727619 Action_times=3217667 Epoche=4842\n",
      "Epsilon=0.727543 Action_times=3218725 Epoche=4843\n",
      "Epsilon=0.727452 Action_times=3219989 Epoche=4844\n",
      "Epsilon=0.727414 Action_times=3220515 Epoche=4845\n",
      "Epsilon=0.727346 Action_times=3221460 Epoche=4846\n",
      "Epsilon=0.727253 Action_times=3222760 Epoche=4847\n",
      "Epsilon=0.727206 Action_times=3223413 Epoche=4848\n",
      "Epsilon=0.727141 Action_times=3224326 Epoche=4849\n",
      "Epsilon=0.727098 Action_times=3224923 Epoche=4850\n",
      "Epsilon=0.727023 Action_times=3225977 Epoche=4851\n",
      "Epsilon=0.726948 Action_times=3227012 Epoche=4852\n",
      "Epsilon=0.726796 Action_times=3229132 Epoche=4853\n",
      "Epsilon=0.726664 Action_times=3230977 Epoche=4854\n",
      "Epsilon=0.726579 Action_times=3232162 Epoche=4855\n",
      "Epsilon=0.726482 Action_times=3233517 Epoche=4856\n",
      "Epsilon=0.726461 Action_times=3233818 Epoche=4857\n",
      "Epsilon=0.726358 Action_times=3235254 Epoche=4858\n",
      "Epsilon=0.726249 Action_times=3236774 Epoche=4859\n",
      "Epsilon=0.726119 Action_times=3238587 Epoche=4860\n",
      "Epsilon=0.726049 Action_times=3239563 Epoche=4861\n",
      "Epsilon=0.725951 Action_times=3240937 Epoche=4862\n",
      "Epsilon=0.725888 Action_times=3241817 Epoche=4863\n",
      "Epsilon=0.725784 Action_times=3243263 Epoche=4864\n",
      "Epsilon=0.725648 Action_times=3245167 Epoche=4865\n",
      "Epsilon=0.725533 Action_times=3246773 Epoche=4866\n",
      "Epsilon=0.725431 Action_times=3248196 Epoche=4867\n",
      "Epsilon=0.725376 Action_times=3248963 Epoche=4868\n",
      "Epsilon=0.725262 Action_times=3250566 Epoche=4869\n",
      "Epsilon=0.725151 Action_times=3252111 Epoche=4870\n",
      "Epsilon=0.725048 Action_times=3253559 Epoche=4871\n",
      "Epsilon=0.724941 Action_times=3255051 Epoche=4872\n",
      "Epsilon=0.724903 Action_times=3255574 Epoche=4873\n",
      "Epsilon=0.724876 Action_times=3255956 Epoche=4874\n",
      "Epsilon=0.724618 Action_times=3259564 Epoche=4875\n",
      "Epsilon=0.724479 Action_times=3261516 Epoche=4876\n",
      "Epsilon=0.724415 Action_times=3262415 Epoche=4877\n",
      "Epsilon=0.724302 Action_times=3263988 Epoche=4878\n",
      "Epsilon=0.724282 Action_times=3264269 Epoche=4879\n",
      "Epsilon=0.724171 Action_times=3265831 Epoche=4880\n",
      "Epsilon=0.724126 Action_times=3266460 Epoche=4881\n",
      "Epsilon=0.724032 Action_times=3267769 Epoche=4882\n",
      "Epsilon=0.723919 Action_times=3269360 Epoche=4883\n",
      "Epsilon=0.723798 Action_times=3271053 Epoche=4884\n",
      "Epsilon=0.723761 Action_times=3271568 Epoche=4885\n",
      "Epsilon=0.723710 Action_times=3272281 Epoche=4886\n",
      "Epsilon=0.723559 Action_times=3274398 Epoche=4887\n",
      "Epsilon=0.723506 Action_times=3275139 Epoche=4888\n",
      "Epsilon=0.723459 Action_times=3275804 Epoche=4889\n",
      "Epsilon=0.723444 Action_times=3276004 Epoche=4890\n",
      "Epsilon=0.723376 Action_times=3276960 Epoche=4891\n",
      "Epsilon=0.723231 Action_times=3278994 Epoche=4892\n",
      "Epsilon=0.723149 Action_times=3280149 Epoche=4893\n",
      "Epsilon=0.723078 Action_times=3281140 Epoche=4894\n",
      "Epsilon=0.723056 Action_times=3281450 Epoche=4895\n",
      "Epsilon=0.722979 Action_times=3282526 Epoche=4896\n",
      "Epsilon=0.722974 Action_times=3282598 Epoche=4897\n",
      "Epsilon=0.722909 Action_times=3283509 Epoche=4898\n",
      "Epsilon=0.722820 Action_times=3284765 Epoche=4899\n",
      "Epsilon=0.722808 Action_times=3284928 Epoche=4900\n",
      "Epsilon=0.722769 Action_times=3285472 Epoche=4901\n",
      "Epsilon=0.722690 Action_times=3286577 Epoche=4902\n",
      "Epsilon=0.722654 Action_times=3287093 Epoche=4903\n",
      "Epsilon=0.722546 Action_times=3288603 Epoche=4904\n",
      "Epsilon=0.722382 Action_times=3290911 Epoche=4905\n",
      "Epsilon=0.722332 Action_times=3291613 Epoche=4906\n",
      "Epsilon=0.722247 Action_times=3292800 Epoche=4907\n",
      "Epsilon=0.722244 Action_times=3292847 Epoche=4908\n",
      "Epsilon=0.722183 Action_times=3293703 Epoche=4909\n",
      "Epsilon=0.722154 Action_times=3294109 Epoche=4910\n",
      "Epsilon=0.722066 Action_times=3295337 Epoche=4911\n",
      "Epsilon=0.722012 Action_times=3296105 Epoche=4912\n",
      "Epsilon=0.721942 Action_times=3297083 Epoche=4913\n",
      "Epsilon=0.721845 Action_times=3298450 Epoche=4914\n",
      "Epsilon=0.721789 Action_times=3299240 Epoche=4915\n",
      "Epsilon=0.721746 Action_times=3299840 Epoche=4916\n",
      "Epsilon=0.721694 Action_times=3300573 Epoche=4917\n",
      "Epsilon=0.721653 Action_times=3301145 Epoche=4918\n",
      "Epsilon=0.721589 Action_times=3302039 Epoche=4919\n",
      "Epsilon=0.721580 Action_times=3302174 Epoche=4920\n",
      "Epsilon=0.721504 Action_times=3303238 Epoche=4921\n",
      "Epsilon=0.721417 Action_times=3304464 Epoche=4922\n",
      "Epsilon=0.721409 Action_times=3304577 Epoche=4923\n",
      "Epsilon=0.721387 Action_times=3304881 Epoche=4924\n",
      "Epsilon=0.721362 Action_times=3305241 Epoche=4925\n",
      "Epsilon=0.721248 Action_times=3306840 Epoche=4926\n",
      "Epsilon=0.721111 Action_times=3308767 Epoche=4927\n",
      "Epsilon=0.721053 Action_times=3309579 Epoche=4928\n",
      "Epsilon=0.721004 Action_times=3310268 Epoche=4929\n",
      "Epsilon=0.720903 Action_times=3311683 Epoche=4930\n",
      "Epsilon=0.720888 Action_times=3311894 Epoche=4931\n",
      "Epsilon=0.720781 Action_times=3313409 Epoche=4932\n",
      "Epsilon=0.720658 Action_times=3315135 Epoche=4933\n",
      "Epsilon=0.720617 Action_times=3315720 Epoche=4934\n",
      "Epsilon=0.720592 Action_times=3316072 Epoche=4935\n",
      "Epsilon=0.720485 Action_times=3317571 Epoche=4936\n",
      "Epsilon=0.720421 Action_times=3318474 Epoche=4937\n",
      "Epsilon=0.720354 Action_times=3319415 Epoche=4938\n",
      "Epsilon=0.720311 Action_times=3320027 Epoche=4939\n",
      "Epsilon=0.720131 Action_times=3322554 Epoche=4940\n",
      "Epsilon=0.720065 Action_times=3323490 Epoche=4941\n",
      "Epsilon=0.719939 Action_times=3325256 Epoche=4942\n",
      "Epsilon=0.719854 Action_times=3326460 Epoche=4943\n",
      "Epsilon=0.719744 Action_times=3328003 Epoche=4944\n",
      "Epsilon=0.719647 Action_times=3329366 Epoche=4945\n",
      "Epsilon=0.719595 Action_times=3330105 Epoche=4946\n",
      "Epsilon=0.719501 Action_times=3331432 Epoche=4947\n",
      "Epsilon=0.719436 Action_times=3332350 Epoche=4948\n",
      "Epsilon=0.719317 Action_times=3334026 Epoche=4949\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.719232 Action_times=3335229 Epoche=4950\n",
      "Epsilon=0.719206 Action_times=3335584 Epoche=4951\n",
      "Epsilon=0.719132 Action_times=3336634 Epoche=4952\n",
      "Epsilon=0.719041 Action_times=3337920 Epoche=4953\n",
      "Epsilon=0.719027 Action_times=3338115 Epoche=4954\n",
      "Epsilon=0.718946 Action_times=3339260 Epoche=4955\n",
      "Epsilon=0.718888 Action_times=3340077 Epoche=4956\n",
      "Epsilon=0.718825 Action_times=3340967 Epoche=4957\n",
      "Epsilon=0.718789 Action_times=3341467 Epoche=4958\n",
      "Epsilon=0.718762 Action_times=3341857 Epoche=4959\n",
      "Epsilon=0.718663 Action_times=3343244 Epoche=4960\n",
      "Epsilon=0.718627 Action_times=3343763 Epoche=4961\n",
      "Epsilon=0.718524 Action_times=3345205 Epoche=4962\n",
      "Epsilon=0.718477 Action_times=3345875 Epoche=4963\n",
      "Epsilon=0.718400 Action_times=3346962 Epoche=4964\n",
      "Epsilon=0.718336 Action_times=3347869 Epoche=4965\n",
      "Epsilon=0.718257 Action_times=3348980 Epoche=4966\n",
      "Epsilon=0.718127 Action_times=3350821 Epoche=4967\n",
      "Epsilon=0.718068 Action_times=3351653 Epoche=4968\n",
      "Epsilon=0.718021 Action_times=3352314 Epoche=4969\n",
      "Epsilon=0.717923 Action_times=3353690 Epoche=4970\n",
      "Epsilon=0.717865 Action_times=3354514 Epoche=4971\n",
      "Epsilon=0.717739 Action_times=3356289 Epoche=4972\n",
      "Epsilon=0.717598 Action_times=3358291 Epoche=4973\n",
      "Epsilon=0.717510 Action_times=3359532 Epoche=4974\n",
      "Epsilon=0.717401 Action_times=3361073 Epoche=4975\n",
      "Epsilon=0.717367 Action_times=3361552 Epoche=4976\n",
      "Epsilon=0.717267 Action_times=3362968 Epoche=4977\n",
      "Epsilon=0.717164 Action_times=3364430 Epoche=4978\n",
      "Epsilon=0.717123 Action_times=3365008 Epoche=4979\n",
      "Epsilon=0.717096 Action_times=3365380 Epoche=4980\n",
      "Epsilon=0.717042 Action_times=3366149 Epoche=4981\n",
      "Epsilon=0.716977 Action_times=3367064 Epoche=4982\n",
      "Epsilon=0.716887 Action_times=3368345 Epoche=4983\n",
      "Epsilon=0.716882 Action_times=3368410 Epoche=4984\n",
      "Epsilon=0.716805 Action_times=3369501 Epoche=4985\n",
      "Epsilon=0.716757 Action_times=3370185 Epoche=4986\n",
      "Epsilon=0.716703 Action_times=3370943 Epoche=4987\n",
      "Epsilon=0.716638 Action_times=3371869 Epoche=4988\n",
      "Epsilon=0.716517 Action_times=3373581 Epoche=4989\n",
      "Epsilon=0.716346 Action_times=3375999 Epoche=4990\n",
      "Epsilon=0.716229 Action_times=3377658 Epoche=4991\n",
      "Epsilon=0.716181 Action_times=3378339 Epoche=4992\n",
      "Epsilon=0.716145 Action_times=3378846 Epoche=4993\n",
      "Epsilon=0.716005 Action_times=3380825 Epoche=4994\n",
      "Epsilon=0.715956 Action_times=3381518 Epoche=4995\n",
      "Epsilon=0.715843 Action_times=3383117 Epoche=4996\n",
      "Epsilon=0.715771 Action_times=3384140 Epoche=4997\n",
      "Epsilon=0.715668 Action_times=3385596 Epoche=4998\n",
      "Epsilon=0.715641 Action_times=3385989 Epoche=4999\n",
      "Epsilon=0.715507 Action_times=3387881 Epoche=5000\n",
      "Epsilon=0.715503 Action_times=3387940 Epoche=5001\n",
      "Epsilon=0.715413 Action_times=3389214 Epoche=5002\n",
      "Epsilon=0.715320 Action_times=3390533 Epoche=5003\n",
      "Epsilon=0.715252 Action_times=3391496 Epoche=5004\n",
      "Epsilon=0.715143 Action_times=3393045 Epoche=5005\n",
      "Epsilon=0.715124 Action_times=3393313 Epoche=5006\n",
      "Epsilon=0.715078 Action_times=3393960 Epoche=5007\n",
      "Epsilon=0.715042 Action_times=3394471 Epoche=5008\n",
      "Epsilon=0.714945 Action_times=3395851 Epoche=5009\n",
      "Epsilon=0.714870 Action_times=3396909 Epoche=5010\n",
      "Epsilon=0.714824 Action_times=3397569 Epoche=5011\n",
      "Epsilon=0.714751 Action_times=3398601 Epoche=5012\n",
      "Epsilon=0.714629 Action_times=3400337 Epoche=5013\n",
      "Epsilon=0.714544 Action_times=3401541 Epoche=5014\n",
      "Epsilon=0.714412 Action_times=3403415 Epoche=5015\n",
      "Epsilon=0.714262 Action_times=3405539 Epoche=5016\n",
      "Epsilon=0.714165 Action_times=3406924 Epoche=5017\n",
      "Epsilon=0.714106 Action_times=3407761 Epoche=5018\n",
      "Epsilon=0.713990 Action_times=3409401 Epoche=5019\n",
      "Epsilon=0.713942 Action_times=3410095 Epoche=5020\n",
      "Epsilon=0.713847 Action_times=3411440 Epoche=5021\n",
      "Epsilon=0.713802 Action_times=3412081 Epoche=5022\n",
      "Epsilon=0.713765 Action_times=3412604 Epoche=5023\n",
      "Epsilon=0.713694 Action_times=3413620 Epoche=5024\n",
      "Epsilon=0.713627 Action_times=3414570 Epoche=5025\n",
      "Epsilon=0.713460 Action_times=3416943 Epoche=5026\n",
      "Epsilon=0.713373 Action_times=3418169 Epoche=5027\n",
      "Epsilon=0.713277 Action_times=3419548 Epoche=5028\n",
      "Epsilon=0.713124 Action_times=3421713 Epoche=5029\n",
      "Epsilon=0.713057 Action_times=3422664 Epoche=5030\n",
      "Epsilon=0.712878 Action_times=3425215 Epoche=5031\n",
      "Epsilon=0.712821 Action_times=3426030 Epoche=5032\n",
      "Epsilon=0.712780 Action_times=3426609 Epoche=5033\n",
      "Epsilon=0.712634 Action_times=3428687 Epoche=5034\n",
      "Epsilon=0.712501 Action_times=3430578 Epoche=5035\n",
      "Epsilon=0.712464 Action_times=3431109 Epoche=5036\n",
      "Epsilon=0.712387 Action_times=3432200 Epoche=5037\n",
      "Epsilon=0.712340 Action_times=3432875 Epoche=5038\n",
      "Epsilon=0.712236 Action_times=3434360 Epoche=5039\n",
      "Epsilon=0.712181 Action_times=3435144 Epoche=5040\n",
      "Epsilon=0.712134 Action_times=3435809 Epoche=5041\n",
      "Epsilon=0.712075 Action_times=3436642 Epoche=5042\n",
      "Epsilon=0.711982 Action_times=3437973 Epoche=5043\n",
      "Epsilon=0.711940 Action_times=3438576 Epoche=5044\n",
      "Epsilon=0.711882 Action_times=3439394 Epoche=5045\n",
      "Epsilon=0.711796 Action_times=3440622 Epoche=5046\n",
      "Epsilon=0.711706 Action_times=3441903 Epoche=5047\n",
      "Epsilon=0.711664 Action_times=3442503 Epoche=5048\n",
      "Epsilon=0.711610 Action_times=3443277 Epoche=5049\n",
      "Epsilon=0.711532 Action_times=3444383 Epoche=5050\n",
      "Epsilon=0.711355 Action_times=3446913 Epoche=5051\n",
      "Epsilon=0.711240 Action_times=3448541 Epoche=5052\n",
      "Epsilon=0.711146 Action_times=3449894 Epoche=5053\n",
      "Epsilon=0.711077 Action_times=3450870 Epoche=5054\n",
      "Epsilon=0.711060 Action_times=3451120 Epoche=5055\n",
      "Epsilon=0.710963 Action_times=3452503 Epoche=5056\n",
      "Epsilon=0.710878 Action_times=3453715 Epoche=5057\n",
      "Epsilon=0.710793 Action_times=3454919 Epoche=5058\n",
      "Epsilon=0.710702 Action_times=3456223 Epoche=5059\n",
      "Epsilon=0.710539 Action_times=3458553 Epoche=5060\n",
      "Epsilon=0.710475 Action_times=3459461 Epoche=5061\n",
      "Epsilon=0.710409 Action_times=3460401 Epoche=5062\n",
      "Epsilon=0.710336 Action_times=3461454 Epoche=5063\n",
      "Epsilon=0.710210 Action_times=3463243 Epoche=5064\n",
      "Epsilon=0.710153 Action_times=3464065 Epoche=5065\n",
      "Epsilon=0.710071 Action_times=3465236 Epoche=5066\n",
      "Epsilon=0.709984 Action_times=3466479 Epoche=5067\n",
      "Epsilon=0.709929 Action_times=3467264 Epoche=5068\n",
      "Epsilon=0.709888 Action_times=3467848 Epoche=5069\n",
      "Epsilon=0.709774 Action_times=3469482 Epoche=5070\n",
      "Epsilon=0.709703 Action_times=3470485 Epoche=5071\n",
      "Epsilon=0.709617 Action_times=3471719 Epoche=5072\n",
      "Epsilon=0.709546 Action_times=3472733 Epoche=5073\n",
      "Epsilon=0.709453 Action_times=3474061 Epoche=5074\n",
      "Epsilon=0.709414 Action_times=3474618 Epoche=5075\n",
      "Epsilon=0.709325 Action_times=3475895 Epoche=5076\n",
      "Epsilon=0.709233 Action_times=3477204 Epoche=5077\n",
      "Epsilon=0.709168 Action_times=3478144 Epoche=5078\n",
      "Epsilon=0.709151 Action_times=3478389 Epoche=5079\n",
      "Epsilon=0.709133 Action_times=3478646 Epoche=5080\n",
      "Epsilon=0.709049 Action_times=3479839 Epoche=5081\n",
      "Epsilon=0.708922 Action_times=3481653 Epoche=5082\n",
      "Epsilon=0.708855 Action_times=3482612 Epoche=5083\n",
      "Epsilon=0.708730 Action_times=3484408 Epoche=5084\n",
      "Epsilon=0.708708 Action_times=3484726 Epoche=5085\n",
      "Epsilon=0.708588 Action_times=3486431 Epoche=5086\n",
      "Epsilon=0.708504 Action_times=3487646 Epoche=5087\n",
      "Epsilon=0.708449 Action_times=3488427 Epoche=5088\n",
      "Epsilon=0.708377 Action_times=3489456 Epoche=5089\n",
      "Epsilon=0.708333 Action_times=3490084 Epoche=5090\n",
      "Epsilon=0.708199 Action_times=3492003 Epoche=5091\n",
      "Epsilon=0.708079 Action_times=3493730 Epoche=5092\n",
      "Epsilon=0.708048 Action_times=3494177 Epoche=5093\n",
      "Epsilon=0.708006 Action_times=3494779 Epoche=5094\n",
      "Epsilon=0.707961 Action_times=3495417 Epoche=5095\n",
      "Epsilon=0.707887 Action_times=3496480 Epoche=5096\n",
      "Epsilon=0.707793 Action_times=3497818 Epoche=5097\n",
      "Epsilon=0.707730 Action_times=3498728 Epoche=5098\n",
      "Epsilon=0.707631 Action_times=3500147 Epoche=5099\n",
      "Epsilon=0.707600 Action_times=3500595 Epoche=5100\n",
      "Epsilon=0.707507 Action_times=3501917 Epoche=5101\n",
      "Epsilon=0.707422 Action_times=3503139 Epoche=5102\n",
      "Epsilon=0.707376 Action_times=3503796 Epoche=5103\n",
      "Epsilon=0.707273 Action_times=3505273 Epoche=5104\n",
      "Epsilon=0.707171 Action_times=3506736 Epoche=5105\n",
      "Epsilon=0.707071 Action_times=3508172 Epoche=5106\n",
      "Epsilon=0.706935 Action_times=3510123 Epoche=5107\n",
      "Epsilon=0.706798 Action_times=3512095 Epoche=5108\n",
      "Epsilon=0.706750 Action_times=3512776 Epoche=5109\n",
      "Epsilon=0.706588 Action_times=3515105 Epoche=5110\n",
      "Epsilon=0.706536 Action_times=3515850 Epoche=5111\n",
      "Epsilon=0.706416 Action_times=3517573 Epoche=5112\n",
      "Epsilon=0.706328 Action_times=3518840 Epoche=5113\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.706242 Action_times=3520071 Epoche=5114\n",
      "Epsilon=0.706162 Action_times=3521232 Epoche=5115\n",
      "Epsilon=0.706091 Action_times=3522243 Epoche=5116\n",
      "Epsilon=0.706053 Action_times=3522787 Epoche=5117\n",
      "Epsilon=0.706008 Action_times=3523434 Epoche=5118\n",
      "Epsilon=0.705952 Action_times=3524240 Epoche=5119\n",
      "Epsilon=0.705883 Action_times=3525235 Epoche=5120\n",
      "Epsilon=0.705824 Action_times=3526089 Epoche=5121\n",
      "Epsilon=0.705790 Action_times=3526572 Epoche=5122\n",
      "Epsilon=0.705728 Action_times=3527459 Epoche=5123\n",
      "Epsilon=0.705665 Action_times=3528369 Epoche=5124\n",
      "Epsilon=0.705596 Action_times=3529366 Epoche=5125\n",
      "Epsilon=0.705587 Action_times=3529485 Epoche=5126\n",
      "Epsilon=0.705567 Action_times=3529772 Epoche=5127\n",
      "Epsilon=0.705544 Action_times=3530110 Epoche=5128\n",
      "Epsilon=0.705484 Action_times=3530967 Epoche=5129\n",
      "Epsilon=0.705358 Action_times=3532777 Epoche=5130\n",
      "Epsilon=0.705351 Action_times=3532883 Epoche=5131\n",
      "Epsilon=0.705315 Action_times=3533395 Epoche=5132\n",
      "Epsilon=0.705254 Action_times=3534270 Epoche=5133\n",
      "Epsilon=0.705249 Action_times=3534343 Epoche=5134\n",
      "Epsilon=0.705196 Action_times=3535110 Epoche=5135\n",
      "Epsilon=0.705122 Action_times=3536174 Epoche=5136\n",
      "Epsilon=0.705074 Action_times=3536867 Epoche=5137\n",
      "Epsilon=0.704989 Action_times=3538089 Epoche=5138\n",
      "Epsilon=0.704928 Action_times=3538964 Epoche=5139\n",
      "Epsilon=0.704833 Action_times=3540341 Epoche=5140\n",
      "Epsilon=0.704740 Action_times=3541672 Epoche=5141\n",
      "Epsilon=0.704623 Action_times=3543356 Epoche=5142\n",
      "Epsilon=0.704579 Action_times=3543989 Epoche=5143\n",
      "Epsilon=0.704539 Action_times=3544562 Epoche=5144\n",
      "Epsilon=0.704504 Action_times=3545064 Epoche=5145\n",
      "Epsilon=0.704456 Action_times=3545756 Epoche=5146\n",
      "Epsilon=0.704432 Action_times=3546111 Epoche=5147\n",
      "Epsilon=0.704399 Action_times=3546581 Epoche=5148\n",
      "Epsilon=0.704242 Action_times=3548849 Epoche=5149\n",
      "Epsilon=0.704212 Action_times=3549282 Epoche=5150\n",
      "Epsilon=0.704122 Action_times=3550574 Epoche=5151\n",
      "Epsilon=0.703944 Action_times=3553140 Epoche=5152\n",
      "Epsilon=0.703916 Action_times=3553539 Epoche=5153\n",
      "Epsilon=0.703734 Action_times=3556169 Epoche=5154\n",
      "Epsilon=0.703689 Action_times=3556816 Epoche=5155\n",
      "Epsilon=0.703529 Action_times=3559119 Epoche=5156\n",
      "Epsilon=0.703347 Action_times=3561741 Epoche=5157\n",
      "Epsilon=0.703269 Action_times=3562872 Epoche=5158\n",
      "Epsilon=0.703194 Action_times=3563956 Epoche=5159\n",
      "Epsilon=0.703104 Action_times=3565251 Epoche=5160\n",
      "Epsilon=0.703009 Action_times=3566613 Epoche=5161\n",
      "Epsilon=0.702916 Action_times=3567955 Epoche=5162\n",
      "Epsilon=0.702840 Action_times=3569054 Epoche=5163\n",
      "Epsilon=0.702790 Action_times=3569774 Epoche=5164\n",
      "Epsilon=0.702778 Action_times=3569955 Epoche=5165\n",
      "Epsilon=0.702727 Action_times=3570683 Epoche=5166\n",
      "Epsilon=0.702647 Action_times=3571839 Epoche=5167\n",
      "Epsilon=0.702629 Action_times=3572106 Epoche=5168\n",
      "Epsilon=0.702540 Action_times=3573396 Epoche=5169\n",
      "Epsilon=0.702523 Action_times=3573631 Epoche=5170\n",
      "Epsilon=0.702454 Action_times=3574630 Epoche=5171\n",
      "Epsilon=0.702410 Action_times=3575268 Epoche=5172\n",
      "Epsilon=0.702213 Action_times=3578109 Epoche=5173\n",
      "Epsilon=0.702166 Action_times=3578798 Epoche=5174\n",
      "Epsilon=0.702043 Action_times=3580562 Epoche=5175\n",
      "Epsilon=0.702032 Action_times=3580729 Epoche=5176\n",
      "Epsilon=0.701991 Action_times=3581320 Epoche=5177\n",
      "Epsilon=0.701952 Action_times=3581877 Epoche=5178\n",
      "Epsilon=0.701877 Action_times=3582968 Epoche=5179\n",
      "Epsilon=0.701785 Action_times=3584298 Epoche=5180\n",
      "Epsilon=0.701732 Action_times=3585061 Epoche=5181\n",
      "Epsilon=0.701713 Action_times=3585341 Epoche=5182\n",
      "Epsilon=0.701648 Action_times=3586277 Epoche=5183\n",
      "Epsilon=0.701619 Action_times=3586697 Epoche=5184\n",
      "Epsilon=0.701469 Action_times=3588872 Epoche=5185\n",
      "Epsilon=0.701354 Action_times=3590525 Epoche=5186\n",
      "Epsilon=0.701298 Action_times=3591337 Epoche=5187\n",
      "Epsilon=0.701262 Action_times=3591857 Epoche=5188\n",
      "Epsilon=0.701233 Action_times=3592277 Epoche=5189\n",
      "Epsilon=0.701133 Action_times=3593725 Epoche=5190\n",
      "Epsilon=0.701018 Action_times=3595385 Epoche=5191\n",
      "Epsilon=0.700898 Action_times=3597132 Epoche=5192\n",
      "Epsilon=0.700866 Action_times=3597588 Epoche=5193\n",
      "Epsilon=0.700782 Action_times=3598801 Epoche=5194\n",
      "Epsilon=0.700731 Action_times=3599552 Epoche=5195\n",
      "Epsilon=0.700620 Action_times=3601149 Epoche=5196\n",
      "Epsilon=0.700435 Action_times=3603826 Epoche=5197\n",
      "Epsilon=0.700317 Action_times=3605539 Epoche=5198\n",
      "Epsilon=0.700222 Action_times=3606914 Epoche=5199\n",
      "Epsilon=0.700149 Action_times=3607974 Epoche=5200\n",
      "Epsilon=0.700037 Action_times=3609599 Epoche=5201\n",
      "Epsilon=0.700006 Action_times=3610052 Epoche=5202\n",
      "Epsilon=0.699972 Action_times=3610541 Epoche=5203\n",
      "Epsilon=0.699894 Action_times=3611668 Epoche=5204\n",
      "Epsilon=0.699879 Action_times=3611887 Epoche=5205\n",
      "Epsilon=0.699848 Action_times=3612339 Epoche=5206\n",
      "Epsilon=0.699755 Action_times=3613680 Epoche=5207\n",
      "Epsilon=0.699668 Action_times=3614948 Epoche=5208\n",
      "Epsilon=0.699567 Action_times=3616415 Epoche=5209\n",
      "Epsilon=0.699530 Action_times=3616941 Epoche=5210\n",
      "Epsilon=0.699454 Action_times=3618055 Epoche=5211\n",
      "Epsilon=0.699351 Action_times=3619547 Epoche=5212\n",
      "Epsilon=0.699263 Action_times=3620819 Epoche=5213\n",
      "Epsilon=0.699158 Action_times=3622346 Epoche=5214\n",
      "Epsilon=0.699059 Action_times=3623782 Epoche=5215\n",
      "Epsilon=0.698904 Action_times=3626027 Epoche=5216\n",
      "Epsilon=0.698877 Action_times=3626429 Epoche=5217\n",
      "Epsilon=0.698774 Action_times=3627920 Epoche=5218\n",
      "Epsilon=0.698566 Action_times=3630931 Epoche=5219\n",
      "Epsilon=0.698485 Action_times=3632110 Epoche=5220\n",
      "Epsilon=0.698445 Action_times=3632695 Epoche=5221\n",
      "Epsilon=0.698439 Action_times=3632780 Epoche=5222\n",
      "Epsilon=0.698329 Action_times=3634382 Epoche=5223\n",
      "Epsilon=0.698057 Action_times=3638333 Epoche=5224\n",
      "Epsilon=0.697877 Action_times=3640948 Epoche=5225\n",
      "Epsilon=0.697795 Action_times=3642148 Epoche=5226\n",
      "Epsilon=0.697749 Action_times=3642816 Epoche=5227\n",
      "Epsilon=0.697672 Action_times=3643924 Epoche=5228\n",
      "Epsilon=0.697644 Action_times=3644340 Epoche=5229\n",
      "Epsilon=0.697457 Action_times=3647054 Epoche=5230\n",
      "Epsilon=0.697284 Action_times=3649576 Epoche=5231\n",
      "Epsilon=0.697275 Action_times=3649706 Epoche=5232\n",
      "Epsilon=0.697112 Action_times=3652080 Epoche=5233\n",
      "Epsilon=0.696922 Action_times=3654842 Epoche=5234\n",
      "Epsilon=0.696805 Action_times=3656542 Epoche=5235\n",
      "Epsilon=0.696753 Action_times=3657296 Epoche=5236\n",
      "Epsilon=0.696707 Action_times=3657978 Epoche=5237\n",
      "Epsilon=0.696656 Action_times=3658713 Epoche=5238\n",
      "Epsilon=0.696557 Action_times=3660163 Epoche=5239\n",
      "Epsilon=0.696513 Action_times=3660803 Epoche=5240\n",
      "Epsilon=0.696408 Action_times=3662327 Epoche=5241\n",
      "Epsilon=0.696381 Action_times=3662728 Epoche=5242\n",
      "Epsilon=0.696268 Action_times=3664372 Epoche=5243\n",
      "Epsilon=0.696258 Action_times=3664508 Epoche=5244\n",
      "Epsilon=0.696161 Action_times=3665920 Epoche=5245\n",
      "Epsilon=0.696069 Action_times=3667274 Epoche=5246\n",
      "Epsilon=0.696007 Action_times=3668178 Epoche=5247\n",
      "Epsilon=0.695978 Action_times=3668601 Epoche=5248\n",
      "Epsilon=0.695947 Action_times=3669044 Epoche=5249\n",
      "Epsilon=0.695871 Action_times=3670155 Epoche=5250\n",
      "Epsilon=0.695784 Action_times=3671423 Epoche=5251\n",
      "Epsilon=0.695701 Action_times=3672631 Epoche=5252\n",
      "Epsilon=0.695651 Action_times=3673362 Epoche=5253\n",
      "Epsilon=0.695586 Action_times=3674317 Epoche=5254\n",
      "Epsilon=0.695508 Action_times=3675448 Epoche=5255\n",
      "Epsilon=0.695457 Action_times=3676196 Epoche=5256\n",
      "Epsilon=0.695403 Action_times=3676975 Epoche=5257\n",
      "Epsilon=0.695272 Action_times=3678897 Epoche=5258\n",
      "Epsilon=0.695232 Action_times=3679478 Epoche=5259\n",
      "Epsilon=0.695186 Action_times=3680146 Epoche=5260\n",
      "Epsilon=0.695118 Action_times=3681133 Epoche=5261\n",
      "Epsilon=0.694948 Action_times=3683617 Epoche=5262\n",
      "Epsilon=0.694927 Action_times=3683921 Epoche=5263\n",
      "Epsilon=0.694877 Action_times=3684664 Epoche=5264\n",
      "Epsilon=0.694773 Action_times=3686171 Epoche=5265\n",
      "Epsilon=0.694694 Action_times=3687324 Epoche=5266\n",
      "Epsilon=0.694661 Action_times=3687816 Epoche=5267\n",
      "Epsilon=0.694624 Action_times=3688348 Epoche=5268\n",
      "Epsilon=0.694587 Action_times=3688891 Epoche=5269\n",
      "Epsilon=0.694582 Action_times=3688962 Epoche=5270\n",
      "Epsilon=0.694558 Action_times=3689309 Epoche=5271\n",
      "Epsilon=0.694535 Action_times=3689648 Epoche=5272\n",
      "Epsilon=0.694501 Action_times=3690155 Epoche=5273\n",
      "Epsilon=0.694398 Action_times=3691649 Epoche=5274\n",
      "Epsilon=0.694307 Action_times=3692980 Epoche=5275\n",
      "Epsilon=0.694275 Action_times=3693453 Epoche=5276\n",
      "Epsilon=0.694173 Action_times=3694946 Epoche=5277\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.694130 Action_times=3695569 Epoche=5278\n",
      "Epsilon=0.694034 Action_times=3696973 Epoche=5279\n",
      "Epsilon=0.694012 Action_times=3697295 Epoche=5280\n",
      "Epsilon=0.693992 Action_times=3697590 Epoche=5281\n",
      "Epsilon=0.693962 Action_times=3698033 Epoche=5282\n",
      "Epsilon=0.693845 Action_times=3699743 Epoche=5283\n",
      "Epsilon=0.693708 Action_times=3701743 Epoche=5284\n",
      "Epsilon=0.693615 Action_times=3703101 Epoche=5285\n",
      "Epsilon=0.693593 Action_times=3703418 Epoche=5286\n",
      "Epsilon=0.693542 Action_times=3704174 Epoche=5287\n",
      "Epsilon=0.693410 Action_times=3706104 Epoche=5288\n",
      "Epsilon=0.693216 Action_times=3708939 Epoche=5289\n",
      "Epsilon=0.693132 Action_times=3710173 Epoche=5290\n",
      "Epsilon=0.693066 Action_times=3711129 Epoche=5291\n",
      "Epsilon=0.693046 Action_times=3711424 Epoche=5292\n",
      "Epsilon=0.692967 Action_times=3712577 Epoche=5293\n",
      "Epsilon=0.692943 Action_times=3712931 Epoche=5294\n",
      "Epsilon=0.692933 Action_times=3713086 Epoche=5295\n",
      "Epsilon=0.692829 Action_times=3714602 Epoche=5296\n",
      "Epsilon=0.692726 Action_times=3716116 Epoche=5297\n",
      "Epsilon=0.692665 Action_times=3717012 Epoche=5298\n",
      "Epsilon=0.692614 Action_times=3717760 Epoche=5299\n",
      "Epsilon=0.692539 Action_times=3718852 Epoche=5300\n",
      "Epsilon=0.692499 Action_times=3719446 Epoche=5301\n",
      "Epsilon=0.692401 Action_times=3720875 Epoche=5302\n",
      "Epsilon=0.692341 Action_times=3721751 Epoche=5303\n",
      "Epsilon=0.692271 Action_times=3722774 Epoche=5304\n",
      "Epsilon=0.692234 Action_times=3723328 Epoche=5305\n",
      "Epsilon=0.692151 Action_times=3724532 Epoche=5306\n",
      "Epsilon=0.692062 Action_times=3725838 Epoche=5307\n",
      "Epsilon=0.691892 Action_times=3728336 Epoche=5308\n",
      "Epsilon=0.691781 Action_times=3729964 Epoche=5309\n",
      "Epsilon=0.691594 Action_times=3732709 Epoche=5310\n",
      "Epsilon=0.691500 Action_times=3734085 Epoche=5311\n",
      "Epsilon=0.691439 Action_times=3734985 Epoche=5312\n",
      "Epsilon=0.691346 Action_times=3736343 Epoche=5313\n",
      "Epsilon=0.691295 Action_times=3737090 Epoche=5314\n",
      "Epsilon=0.691290 Action_times=3737176 Epoche=5315\n",
      "Epsilon=0.691243 Action_times=3737854 Epoche=5316\n",
      "Epsilon=0.691123 Action_times=3739625 Epoche=5317\n",
      "Epsilon=0.691096 Action_times=3740017 Epoche=5318\n",
      "Epsilon=0.691061 Action_times=3740532 Epoche=5319\n",
      "Epsilon=0.691050 Action_times=3740695 Epoche=5320\n",
      "Epsilon=0.690941 Action_times=3742287 Epoche=5321\n",
      "Epsilon=0.690915 Action_times=3742669 Epoche=5322\n",
      "Epsilon=0.690836 Action_times=3743839 Epoche=5323\n",
      "Epsilon=0.690759 Action_times=3744970 Epoche=5324\n",
      "Epsilon=0.690673 Action_times=3746224 Epoche=5325\n",
      "Epsilon=0.690550 Action_times=3748032 Epoche=5326\n",
      "Epsilon=0.690522 Action_times=3748446 Epoche=5327\n",
      "Epsilon=0.690365 Action_times=3750753 Epoche=5328\n",
      "Epsilon=0.690214 Action_times=3752972 Epoche=5329\n",
      "Epsilon=0.690119 Action_times=3754372 Epoche=5330\n",
      "Epsilon=0.689957 Action_times=3756748 Epoche=5331\n",
      "Epsilon=0.689858 Action_times=3758203 Epoche=5332\n",
      "Epsilon=0.689743 Action_times=3759901 Epoche=5333\n",
      "Epsilon=0.689674 Action_times=3760916 Epoche=5334\n",
      "Epsilon=0.689596 Action_times=3762070 Epoche=5335\n",
      "Epsilon=0.689529 Action_times=3763050 Epoche=5336\n",
      "Epsilon=0.689463 Action_times=3764017 Epoche=5337\n",
      "Epsilon=0.689383 Action_times=3765206 Epoche=5338\n",
      "Epsilon=0.689320 Action_times=3766123 Epoche=5339\n",
      "Epsilon=0.689219 Action_times=3767613 Epoche=5340\n",
      "Epsilon=0.689189 Action_times=3768057 Epoche=5341\n",
      "Epsilon=0.689152 Action_times=3768606 Epoche=5342\n",
      "Epsilon=0.689118 Action_times=3769101 Epoche=5343\n",
      "Epsilon=0.689055 Action_times=3770035 Epoche=5344\n",
      "Epsilon=0.688979 Action_times=3771147 Epoche=5345\n",
      "Epsilon=0.688945 Action_times=3771651 Epoche=5346\n",
      "Epsilon=0.688860 Action_times=3772901 Epoche=5347\n",
      "Epsilon=0.688825 Action_times=3773409 Epoche=5348\n",
      "Epsilon=0.688820 Action_times=3773490 Epoche=5349\n",
      "Epsilon=0.688782 Action_times=3774043 Epoche=5350\n",
      "Epsilon=0.688720 Action_times=3774960 Epoche=5351\n",
      "Epsilon=0.688658 Action_times=3775876 Epoche=5352\n",
      "Epsilon=0.688567 Action_times=3777218 Epoche=5353\n",
      "Epsilon=0.688555 Action_times=3777394 Epoche=5354\n",
      "Epsilon=0.688497 Action_times=3778242 Epoche=5355\n",
      "Epsilon=0.688444 Action_times=3779023 Epoche=5356\n",
      "Epsilon=0.688377 Action_times=3780019 Epoche=5357\n",
      "Epsilon=0.688335 Action_times=3780632 Epoche=5358\n",
      "Epsilon=0.688311 Action_times=3780988 Epoche=5359\n",
      "Epsilon=0.688273 Action_times=3781549 Epoche=5360\n",
      "Epsilon=0.688235 Action_times=3782109 Epoche=5361\n",
      "Epsilon=0.688196 Action_times=3782683 Epoche=5362\n",
      "Epsilon=0.688142 Action_times=3783479 Epoche=5363\n",
      "Epsilon=0.688090 Action_times=3784249 Epoche=5364\n",
      "Epsilon=0.688041 Action_times=3784968 Epoche=5365\n",
      "Epsilon=0.687937 Action_times=3786510 Epoche=5366\n",
      "Epsilon=0.687850 Action_times=3787789 Epoche=5367\n",
      "Epsilon=0.687775 Action_times=3788902 Epoche=5368\n",
      "Epsilon=0.687718 Action_times=3789733 Epoche=5369\n",
      "Epsilon=0.687682 Action_times=3790265 Epoche=5370\n",
      "Epsilon=0.687620 Action_times=3791181 Epoche=5371\n",
      "Epsilon=0.687514 Action_times=3792741 Epoche=5372\n",
      "Epsilon=0.687468 Action_times=3793419 Epoche=5373\n",
      "Epsilon=0.687384 Action_times=3794667 Epoche=5374\n",
      "Epsilon=0.687332 Action_times=3795439 Epoche=5375\n",
      "Epsilon=0.687276 Action_times=3796257 Epoche=5376\n",
      "Epsilon=0.687230 Action_times=3796940 Epoche=5377\n",
      "Epsilon=0.687166 Action_times=3797887 Epoche=5378\n",
      "Epsilon=0.687095 Action_times=3798938 Epoche=5379\n",
      "Epsilon=0.687069 Action_times=3799323 Epoche=5380\n",
      "Epsilon=0.686986 Action_times=3800539 Epoche=5381\n",
      "Epsilon=0.686893 Action_times=3801910 Epoche=5382\n",
      "Epsilon=0.686821 Action_times=3802976 Epoche=5383\n",
      "Epsilon=0.686748 Action_times=3804058 Epoche=5384\n",
      "Epsilon=0.686617 Action_times=3805995 Epoche=5385\n",
      "Epsilon=0.686501 Action_times=3807716 Epoche=5386\n",
      "Epsilon=0.686452 Action_times=3808438 Epoche=5387\n",
      "Epsilon=0.686375 Action_times=3809577 Epoche=5388\n",
      "Epsilon=0.686350 Action_times=3809942 Epoche=5389\n",
      "Epsilon=0.686328 Action_times=3810265 Epoche=5390\n",
      "Epsilon=0.686314 Action_times=3810478 Epoche=5391\n",
      "Epsilon=0.686253 Action_times=3811382 Epoche=5392\n",
      "Epsilon=0.686167 Action_times=3812648 Epoche=5393\n",
      "Epsilon=0.686075 Action_times=3814005 Epoche=5394\n",
      "Epsilon=0.685989 Action_times=3815284 Epoche=5395\n",
      "Epsilon=0.685899 Action_times=3816610 Epoche=5396\n",
      "Epsilon=0.685810 Action_times=3817929 Epoche=5397\n",
      "Epsilon=0.685669 Action_times=3820023 Epoche=5398\n",
      "Epsilon=0.685490 Action_times=3822661 Epoche=5399\n",
      "Epsilon=0.685437 Action_times=3823449 Epoche=5400\n",
      "Epsilon=0.685422 Action_times=3823678 Epoche=5401\n",
      "Epsilon=0.685356 Action_times=3824643 Epoche=5402\n",
      "Epsilon=0.685264 Action_times=3826010 Epoche=5403\n",
      "Epsilon=0.685098 Action_times=3828476 Epoche=5404\n",
      "Epsilon=0.685074 Action_times=3828823 Epoche=5405\n",
      "Epsilon=0.685026 Action_times=3829539 Epoche=5406\n",
      "Epsilon=0.685005 Action_times=3829843 Epoche=5407\n",
      "Epsilon=0.684953 Action_times=3830621 Epoche=5408\n",
      "Epsilon=0.684918 Action_times=3831135 Epoche=5409\n",
      "Epsilon=0.684865 Action_times=3831923 Epoche=5410\n",
      "Epsilon=0.684747 Action_times=3833672 Epoche=5411\n",
      "Epsilon=0.684694 Action_times=3834460 Epoche=5412\n",
      "Epsilon=0.684641 Action_times=3835240 Epoche=5413\n",
      "Epsilon=0.684581 Action_times=3836138 Epoche=5414\n",
      "Epsilon=0.684362 Action_times=3839372 Epoche=5415\n",
      "Epsilon=0.684273 Action_times=3840699 Epoche=5416\n",
      "Epsilon=0.684247 Action_times=3841083 Epoche=5417\n",
      "Epsilon=0.684214 Action_times=3841574 Epoche=5418\n",
      "Epsilon=0.684184 Action_times=3842024 Epoche=5419\n",
      "Epsilon=0.684157 Action_times=3842426 Epoche=5420\n",
      "Epsilon=0.683965 Action_times=3845266 Epoche=5421\n",
      "Epsilon=0.683925 Action_times=3845864 Epoche=5422\n",
      "Epsilon=0.683868 Action_times=3846708 Epoche=5423\n",
      "Epsilon=0.683868 Action_times=3846714 Epoche=5424\n",
      "Epsilon=0.683837 Action_times=3847174 Epoche=5425\n",
      "Epsilon=0.683814 Action_times=3847501 Epoche=5426\n",
      "Epsilon=0.683614 Action_times=3850472 Epoche=5427\n",
      "Epsilon=0.683541 Action_times=3851554 Epoche=5428\n",
      "Epsilon=0.683394 Action_times=3853745 Epoche=5429\n",
      "Epsilon=0.683338 Action_times=3854575 Epoche=5430\n",
      "Epsilon=0.683298 Action_times=3855163 Epoche=5431\n",
      "Epsilon=0.683255 Action_times=3855809 Epoche=5432\n",
      "Epsilon=0.683175 Action_times=3856995 Epoche=5433\n",
      "Epsilon=0.683073 Action_times=3858508 Epoche=5434\n",
      "Epsilon=0.683034 Action_times=3859096 Epoche=5435\n",
      "Epsilon=0.682970 Action_times=3860041 Epoche=5436\n",
      "Epsilon=0.682880 Action_times=3861372 Epoche=5437\n",
      "Epsilon=0.682842 Action_times=3861950 Epoche=5438\n",
      "Epsilon=0.682730 Action_times=3863605 Epoche=5439\n",
      "Epsilon=0.682650 Action_times=3864805 Epoche=5440\n",
      "Epsilon=0.682604 Action_times=3865480 Epoche=5441\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.682461 Action_times=3867604 Epoche=5442\n",
      "Epsilon=0.682436 Action_times=3867975 Epoche=5443\n",
      "Epsilon=0.682367 Action_times=3869008 Epoche=5444\n",
      "Epsilon=0.682318 Action_times=3869736 Epoche=5445\n",
      "Epsilon=0.682247 Action_times=3870789 Epoche=5446\n",
      "Epsilon=0.682193 Action_times=3871589 Epoche=5447\n",
      "Epsilon=0.682100 Action_times=3872980 Epoche=5448\n",
      "Epsilon=0.681961 Action_times=3875049 Epoche=5449\n",
      "Epsilon=0.681843 Action_times=3876805 Epoche=5450\n",
      "Epsilon=0.681831 Action_times=3876986 Epoche=5451\n",
      "Epsilon=0.681828 Action_times=3877026 Epoche=5452\n",
      "Epsilon=0.681750 Action_times=3878189 Epoche=5453\n",
      "Epsilon=0.681658 Action_times=3879562 Epoche=5454\n",
      "Epsilon=0.681599 Action_times=3880439 Epoche=5455\n",
      "Epsilon=0.681562 Action_times=3880991 Epoche=5456\n",
      "Epsilon=0.681472 Action_times=3882323 Epoche=5457\n",
      "Epsilon=0.681393 Action_times=3883507 Epoche=5458\n",
      "Epsilon=0.681325 Action_times=3884521 Epoche=5459\n",
      "Epsilon=0.681119 Action_times=3887583 Epoche=5460\n",
      "Epsilon=0.680935 Action_times=3890322 Epoche=5461\n",
      "Epsilon=0.680911 Action_times=3890686 Epoche=5462\n",
      "Epsilon=0.680840 Action_times=3891748 Epoche=5463\n",
      "Epsilon=0.680777 Action_times=3892688 Epoche=5464\n",
      "Epsilon=0.680653 Action_times=3894530 Epoche=5465\n",
      "Epsilon=0.680474 Action_times=3897206 Epoche=5466\n",
      "Epsilon=0.680453 Action_times=3897509 Epoche=5467\n",
      "Epsilon=0.680435 Action_times=3897777 Epoche=5468\n",
      "Epsilon=0.680384 Action_times=3898550 Epoche=5469\n",
      "Epsilon=0.680373 Action_times=3898710 Epoche=5470\n",
      "Epsilon=0.680255 Action_times=3900466 Epoche=5471\n",
      "Epsilon=0.680207 Action_times=3901180 Epoche=5472\n",
      "Epsilon=0.680187 Action_times=3901488 Epoche=5473\n",
      "Epsilon=0.680101 Action_times=3902770 Epoche=5474\n",
      "Epsilon=0.680086 Action_times=3902986 Epoche=5475\n",
      "Epsilon=0.680002 Action_times=3904241 Epoche=5476\n",
      "Epsilon=0.679890 Action_times=3905913 Epoche=5477\n",
      "Epsilon=0.679866 Action_times=3906274 Epoche=5478\n",
      "Epsilon=0.679820 Action_times=3906955 Epoche=5479\n",
      "Epsilon=0.679769 Action_times=3907715 Epoche=5480\n",
      "Epsilon=0.679748 Action_times=3908036 Epoche=5481\n",
      "Epsilon=0.679612 Action_times=3910058 Epoche=5482\n",
      "Epsilon=0.679544 Action_times=3911074 Epoche=5483\n",
      "Epsilon=0.679485 Action_times=3911955 Epoche=5484\n",
      "Epsilon=0.679484 Action_times=3911973 Epoche=5485\n",
      "Epsilon=0.679378 Action_times=3913556 Epoche=5486\n",
      "Epsilon=0.679343 Action_times=3914087 Epoche=5487\n",
      "Epsilon=0.679258 Action_times=3915358 Epoche=5488\n",
      "Epsilon=0.679219 Action_times=3915934 Epoche=5489\n",
      "Epsilon=0.679186 Action_times=3916429 Epoche=5490\n",
      "Epsilon=0.679135 Action_times=3917191 Epoche=5491\n",
      "Epsilon=0.679077 Action_times=3918060 Epoche=5492\n",
      "Epsilon=0.679069 Action_times=3918173 Epoche=5493\n",
      "Epsilon=0.679065 Action_times=3918241 Epoche=5494\n",
      "Epsilon=0.679000 Action_times=3919216 Epoche=5495\n",
      "Epsilon=0.678906 Action_times=3920621 Epoche=5496\n",
      "Epsilon=0.678743 Action_times=3923044 Epoche=5497\n",
      "Epsilon=0.678701 Action_times=3923672 Epoche=5498\n",
      "Epsilon=0.678577 Action_times=3925539 Epoche=5499\n",
      "Epsilon=0.678438 Action_times=3927610 Epoche=5500\n",
      "Epsilon=0.678413 Action_times=3927991 Epoche=5501\n",
      "Epsilon=0.678276 Action_times=3930034 Epoche=5502\n",
      "Epsilon=0.678232 Action_times=3930694 Epoche=5503\n",
      "Epsilon=0.678163 Action_times=3931727 Epoche=5504\n",
      "Epsilon=0.678116 Action_times=3932433 Epoche=5505\n",
      "Epsilon=0.678010 Action_times=3934023 Epoche=5506\n",
      "Epsilon=0.677929 Action_times=3935226 Epoche=5507\n",
      "Epsilon=0.677899 Action_times=3935676 Epoche=5508\n",
      "Epsilon=0.677831 Action_times=3936700 Epoche=5509\n",
      "Epsilon=0.677781 Action_times=3937440 Epoche=5510\n",
      "Epsilon=0.677674 Action_times=3939056 Epoche=5511\n",
      "Epsilon=0.677577 Action_times=3940501 Epoche=5512\n",
      "Epsilon=0.677541 Action_times=3941042 Epoche=5513\n",
      "Epsilon=0.677474 Action_times=3942046 Epoche=5514\n",
      "Epsilon=0.677344 Action_times=3943990 Epoche=5515\n",
      "Epsilon=0.677238 Action_times=3945585 Epoche=5516\n",
      "Epsilon=0.677166 Action_times=3946658 Epoche=5517\n",
      "Epsilon=0.677071 Action_times=3948082 Epoche=5518\n",
      "Epsilon=0.676971 Action_times=3949589 Epoche=5519\n",
      "Epsilon=0.676952 Action_times=3949869 Epoche=5520\n",
      "Epsilon=0.676855 Action_times=3951323 Epoche=5521\n",
      "Epsilon=0.676779 Action_times=3952461 Epoche=5522\n",
      "Epsilon=0.676725 Action_times=3953269 Epoche=5523\n",
      "Epsilon=0.676647 Action_times=3954436 Epoche=5524\n",
      "Epsilon=0.676598 Action_times=3955184 Epoche=5525\n",
      "Epsilon=0.676456 Action_times=3957308 Epoche=5526\n",
      "Epsilon=0.676425 Action_times=3957770 Epoche=5527\n",
      "Epsilon=0.676335 Action_times=3959122 Epoche=5528\n",
      "Epsilon=0.676283 Action_times=3959902 Epoche=5529\n",
      "Epsilon=0.676159 Action_times=3961772 Epoche=5530\n",
      "Epsilon=0.676142 Action_times=3962018 Epoche=5531\n",
      "Epsilon=0.676118 Action_times=3962379 Epoche=5532\n",
      "Epsilon=0.675928 Action_times=3965230 Epoche=5533\n",
      "Epsilon=0.675891 Action_times=3965793 Epoche=5534\n",
      "Epsilon=0.675842 Action_times=3966529 Epoche=5535\n",
      "Epsilon=0.675579 Action_times=3970474 Epoche=5536\n",
      "Epsilon=0.675513 Action_times=3971473 Epoche=5537\n",
      "Epsilon=0.675458 Action_times=3972301 Epoche=5538\n",
      "Epsilon=0.675340 Action_times=3974063 Epoche=5539\n",
      "Epsilon=0.675266 Action_times=3975185 Epoche=5540\n",
      "Epsilon=0.675016 Action_times=3978932 Epoche=5541\n",
      "Epsilon=0.674913 Action_times=3980482 Epoche=5542\n",
      "Epsilon=0.674821 Action_times=3981878 Epoche=5543\n",
      "Epsilon=0.674667 Action_times=3984188 Epoche=5544\n",
      "Epsilon=0.674630 Action_times=3984742 Epoche=5545\n",
      "Epsilon=0.674515 Action_times=3986474 Epoche=5546\n",
      "Epsilon=0.674460 Action_times=3987309 Epoche=5547\n",
      "Epsilon=0.674416 Action_times=3987972 Epoche=5548\n",
      "Epsilon=0.674347 Action_times=3989009 Epoche=5549\n",
      "Epsilon=0.674301 Action_times=3989689 Epoche=5550\n",
      "Epsilon=0.674291 Action_times=3989843 Epoche=5551\n",
      "Epsilon=0.674153 Action_times=3991928 Epoche=5552\n",
      "Epsilon=0.674127 Action_times=3992315 Epoche=5553\n",
      "Epsilon=0.674116 Action_times=3992483 Epoche=5554\n",
      "Epsilon=0.674018 Action_times=3993964 Epoche=5555\n",
      "Epsilon=0.674006 Action_times=3994144 Epoche=5556\n",
      "Epsilon=0.673873 Action_times=3996134 Epoche=5557\n",
      "Epsilon=0.673738 Action_times=3998171 Epoche=5558\n",
      "Epsilon=0.673644 Action_times=3999597 Epoche=5559\n",
      "Epsilon=0.673568 Action_times=4000734 Epoche=5560\n",
      "Epsilon=0.673470 Action_times=4002214 Epoche=5561\n",
      "Epsilon=0.673429 Action_times=4002835 Epoche=5562\n",
      "Epsilon=0.673412 Action_times=4003085 Epoche=5563\n",
      "Epsilon=0.673327 Action_times=4004369 Epoche=5564\n",
      "Epsilon=0.673258 Action_times=4005416 Epoche=5565\n",
      "Epsilon=0.673237 Action_times=4005731 Epoche=5566\n",
      "Epsilon=0.673157 Action_times=4006939 Epoche=5567\n",
      "Epsilon=0.673075 Action_times=4008172 Epoche=5568\n",
      "Epsilon=0.673012 Action_times=4009122 Epoche=5569\n",
      "Epsilon=0.672966 Action_times=4009811 Epoche=5570\n",
      "Epsilon=0.672900 Action_times=4010809 Epoche=5571\n",
      "Epsilon=0.672852 Action_times=4011531 Epoche=5572\n",
      "Epsilon=0.672830 Action_times=4011857 Epoche=5573\n",
      "Epsilon=0.672752 Action_times=4013045 Epoche=5574\n",
      "Epsilon=0.672598 Action_times=4015359 Epoche=5575\n",
      "Epsilon=0.672485 Action_times=4017069 Epoche=5576\n",
      "Epsilon=0.672422 Action_times=4018026 Epoche=5577\n",
      "Epsilon=0.672287 Action_times=4020066 Epoche=5578\n",
      "Epsilon=0.672202 Action_times=4021345 Epoche=5579\n",
      "Epsilon=0.672182 Action_times=4021648 Epoche=5580\n",
      "Epsilon=0.672087 Action_times=4023083 Epoche=5581\n",
      "Epsilon=0.672042 Action_times=4023754 Epoche=5582\n",
      "Epsilon=0.672015 Action_times=4024161 Epoche=5583\n",
      "Epsilon=0.671974 Action_times=4024794 Epoche=5584\n",
      "Epsilon=0.671907 Action_times=4025797 Epoche=5585\n",
      "Epsilon=0.671778 Action_times=4027745 Epoche=5586\n",
      "Epsilon=0.671719 Action_times=4028634 Epoche=5587\n",
      "Epsilon=0.671680 Action_times=4029223 Epoche=5588\n",
      "Epsilon=0.671624 Action_times=4030081 Epoche=5589\n",
      "Epsilon=0.671613 Action_times=4030237 Epoche=5590\n",
      "Epsilon=0.671603 Action_times=4030395 Epoche=5591\n",
      "Epsilon=0.671576 Action_times=4030801 Epoche=5592\n",
      "Epsilon=0.671468 Action_times=4032428 Epoche=5593\n",
      "Epsilon=0.671441 Action_times=4032841 Epoche=5594\n",
      "Epsilon=0.671388 Action_times=4033637 Epoche=5595\n",
      "Epsilon=0.671351 Action_times=4034208 Epoche=5596\n",
      "Epsilon=0.671315 Action_times=4034743 Epoche=5597\n",
      "Epsilon=0.671202 Action_times=4036452 Epoche=5598\n",
      "Epsilon=0.671061 Action_times=4038588 Epoche=5599\n",
      "Epsilon=0.670959 Action_times=4040135 Epoche=5600\n",
      "Epsilon=0.670935 Action_times=4040496 Epoche=5601\n",
      "Epsilon=0.670822 Action_times=4042210 Epoche=5602\n",
      "Epsilon=0.670734 Action_times=4043535 Epoche=5603\n",
      "Epsilon=0.670580 Action_times=4045874 Epoche=5604\n",
      "Epsilon=0.670525 Action_times=4046695 Epoche=5605\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.670517 Action_times=4046821 Epoche=5606\n",
      "Epsilon=0.670384 Action_times=4048834 Epoche=5607\n",
      "Epsilon=0.670326 Action_times=4049708 Epoche=5608\n",
      "Epsilon=0.670244 Action_times=4050949 Epoche=5609\n",
      "Epsilon=0.670115 Action_times=4052915 Epoche=5610\n",
      "Epsilon=0.669991 Action_times=4054785 Epoche=5611\n",
      "Epsilon=0.669943 Action_times=4055519 Epoche=5612\n",
      "Epsilon=0.669938 Action_times=4055588 Epoche=5613\n",
      "Epsilon=0.669885 Action_times=4056397 Epoche=5614\n",
      "Epsilon=0.669783 Action_times=4057937 Epoche=5615\n",
      "Epsilon=0.669724 Action_times=4058828 Epoche=5616\n",
      "Epsilon=0.669645 Action_times=4060025 Epoche=5617\n",
      "Epsilon=0.669550 Action_times=4061472 Epoche=5618\n",
      "Epsilon=0.669440 Action_times=4063132 Epoche=5619\n",
      "Epsilon=0.669368 Action_times=4064238 Epoche=5620\n",
      "Epsilon=0.669267 Action_times=4065763 Epoche=5621\n",
      "Epsilon=0.669241 Action_times=4066152 Epoche=5622\n",
      "Epsilon=0.669154 Action_times=4067483 Epoche=5623\n",
      "Epsilon=0.669101 Action_times=4068288 Epoche=5624\n",
      "Epsilon=0.668976 Action_times=4070177 Epoche=5625\n",
      "Epsilon=0.668864 Action_times=4071876 Epoche=5626\n",
      "Epsilon=0.668799 Action_times=4072872 Epoche=5627\n",
      "Epsilon=0.668750 Action_times=4073611 Epoche=5628\n",
      "Epsilon=0.668684 Action_times=4074613 Epoche=5629\n",
      "Epsilon=0.668666 Action_times=4074880 Epoche=5630\n",
      "Epsilon=0.668621 Action_times=4075573 Epoche=5631\n",
      "Epsilon=0.668535 Action_times=4076870 Epoche=5632\n",
      "Epsilon=0.668382 Action_times=4079198 Epoche=5633\n",
      "Epsilon=0.668357 Action_times=4079571 Epoche=5634\n",
      "Epsilon=0.668285 Action_times=4080675 Epoche=5635\n",
      "Epsilon=0.668259 Action_times=4081071 Epoche=5636\n",
      "Epsilon=0.668230 Action_times=4081504 Epoche=5637\n",
      "Epsilon=0.668147 Action_times=4082759 Epoche=5638\n",
      "Epsilon=0.668088 Action_times=4083666 Epoche=5639\n",
      "Epsilon=0.668072 Action_times=4083913 Epoche=5640\n",
      "Epsilon=0.668015 Action_times=4084769 Epoche=5641\n",
      "Epsilon=0.667966 Action_times=4085513 Epoche=5642\n",
      "Epsilon=0.667902 Action_times=4086491 Epoche=5643\n",
      "Epsilon=0.667843 Action_times=4087382 Epoche=5644\n",
      "Epsilon=0.667835 Action_times=4087513 Epoche=5645\n",
      "Epsilon=0.667780 Action_times=4088351 Epoche=5646\n",
      "Epsilon=0.667666 Action_times=4090078 Epoche=5647\n",
      "Epsilon=0.667574 Action_times=4091483 Epoche=5648\n",
      "Epsilon=0.667431 Action_times=4093655 Epoche=5649\n",
      "Epsilon=0.667303 Action_times=4095594 Epoche=5650\n",
      "Epsilon=0.667225 Action_times=4096791 Epoche=5651\n",
      "Epsilon=0.667202 Action_times=4097135 Epoche=5652\n",
      "Epsilon=0.667178 Action_times=4097495 Epoche=5653\n",
      "Epsilon=0.667114 Action_times=4098467 Epoche=5654\n",
      "Epsilon=0.667069 Action_times=4099158 Epoche=5655\n",
      "Epsilon=0.667055 Action_times=4099365 Epoche=5656\n",
      "Epsilon=0.666966 Action_times=4100728 Epoche=5657\n",
      "Epsilon=0.666823 Action_times=4102906 Epoche=5658\n",
      "Epsilon=0.666801 Action_times=4103232 Epoche=5659\n",
      "Epsilon=0.666704 Action_times=4104708 Epoche=5660\n",
      "Epsilon=0.666683 Action_times=4105033 Epoche=5661\n",
      "Epsilon=0.666555 Action_times=4106982 Epoche=5662\n",
      "Epsilon=0.666524 Action_times=4107461 Epoche=5663\n",
      "Epsilon=0.666487 Action_times=4108024 Epoche=5664\n",
      "Epsilon=0.666297 Action_times=4110922 Epoche=5665\n",
      "Epsilon=0.666244 Action_times=4111717 Epoche=5666\n",
      "Epsilon=0.666164 Action_times=4112937 Epoche=5667\n",
      "Epsilon=0.666107 Action_times=4113818 Epoche=5668\n",
      "Epsilon=0.666001 Action_times=4115433 Epoche=5669\n",
      "Epsilon=0.665992 Action_times=4115559 Epoche=5670\n",
      "Epsilon=0.665822 Action_times=4118150 Epoche=5671\n",
      "Epsilon=0.665742 Action_times=4119382 Epoche=5672\n",
      "Epsilon=0.665712 Action_times=4119828 Epoche=5673\n",
      "Epsilon=0.665644 Action_times=4120872 Epoche=5674\n",
      "Epsilon=0.665523 Action_times=4122719 Epoche=5675\n",
      "Epsilon=0.665513 Action_times=4122870 Epoche=5676\n",
      "Epsilon=0.665418 Action_times=4124324 Epoche=5677\n",
      "Epsilon=0.665337 Action_times=4125558 Epoche=5678\n",
      "Epsilon=0.665323 Action_times=4125760 Epoche=5679\n",
      "Epsilon=0.665269 Action_times=4126586 Epoche=5680\n",
      "Epsilon=0.665228 Action_times=4127217 Epoche=5681\n",
      "Epsilon=0.665184 Action_times=4127885 Epoche=5682\n",
      "Epsilon=0.665115 Action_times=4128936 Epoche=5683\n",
      "Epsilon=0.665076 Action_times=4129534 Epoche=5684\n",
      "Epsilon=0.665011 Action_times=4130522 Epoche=5685\n",
      "Epsilon=0.664983 Action_times=4130960 Epoche=5686\n",
      "Epsilon=0.664931 Action_times=4131747 Epoche=5687\n",
      "Epsilon=0.664893 Action_times=4132335 Epoche=5688\n",
      "Epsilon=0.664823 Action_times=4133394 Epoche=5689\n",
      "Epsilon=0.664792 Action_times=4133875 Epoche=5690\n",
      "Epsilon=0.664628 Action_times=4136377 Epoche=5691\n",
      "Epsilon=0.664608 Action_times=4136687 Epoche=5692\n",
      "Epsilon=0.664532 Action_times=4137842 Epoche=5693\n",
      "Epsilon=0.664479 Action_times=4138655 Epoche=5694\n",
      "Epsilon=0.664366 Action_times=4140375 Epoche=5695\n",
      "Epsilon=0.664338 Action_times=4140814 Epoche=5696\n",
      "Epsilon=0.664241 Action_times=4142296 Epoche=5697\n",
      "Epsilon=0.664150 Action_times=4143678 Epoche=5698\n",
      "Epsilon=0.664137 Action_times=4143876 Epoche=5699\n",
      "Epsilon=0.664088 Action_times=4144625 Epoche=5700\n",
      "Epsilon=0.664069 Action_times=4144920 Epoche=5701\n",
      "Epsilon=0.664059 Action_times=4145071 Epoche=5702\n",
      "Epsilon=0.663986 Action_times=4146191 Epoche=5703\n",
      "Epsilon=0.663959 Action_times=4146597 Epoche=5704\n",
      "Epsilon=0.663925 Action_times=4147130 Epoche=5705\n",
      "Epsilon=0.663916 Action_times=4147263 Epoche=5706\n",
      "Epsilon=0.663810 Action_times=4148888 Epoche=5707\n",
      "Epsilon=0.663676 Action_times=4150929 Epoche=5708\n",
      "Epsilon=0.663643 Action_times=4151432 Epoche=5709\n",
      "Epsilon=0.663590 Action_times=4152241 Epoche=5710\n",
      "Epsilon=0.663540 Action_times=4153014 Epoche=5711\n",
      "Epsilon=0.663513 Action_times=4153425 Epoche=5712\n",
      "Epsilon=0.663422 Action_times=4154824 Epoche=5713\n",
      "Epsilon=0.663306 Action_times=4156591 Epoche=5714\n",
      "Epsilon=0.663289 Action_times=4156859 Epoche=5715\n",
      "Epsilon=0.663223 Action_times=4157861 Epoche=5716\n",
      "Epsilon=0.663165 Action_times=4158755 Epoche=5717\n",
      "Epsilon=0.663038 Action_times=4160696 Epoche=5718\n",
      "Epsilon=0.662947 Action_times=4162089 Epoche=5719\n",
      "Epsilon=0.662880 Action_times=4163114 Epoche=5720\n",
      "Epsilon=0.662793 Action_times=4164442 Epoche=5721\n",
      "Epsilon=0.662679 Action_times=4166194 Epoche=5722\n",
      "Epsilon=0.662619 Action_times=4167110 Epoche=5723\n",
      "Epsilon=0.662603 Action_times=4167360 Epoche=5724\n",
      "Epsilon=0.662553 Action_times=4168126 Epoche=5725\n",
      "Epsilon=0.662498 Action_times=4168965 Epoche=5726\n",
      "Epsilon=0.662427 Action_times=4170059 Epoche=5727\n",
      "Epsilon=0.662337 Action_times=4171436 Epoche=5728\n",
      "Epsilon=0.662288 Action_times=4172185 Epoche=5729\n",
      "Epsilon=0.662234 Action_times=4173012 Epoche=5730\n",
      "Epsilon=0.662123 Action_times=4174714 Epoche=5731\n",
      "Epsilon=0.662080 Action_times=4175378 Epoche=5732\n",
      "Epsilon=0.662073 Action_times=4175477 Epoche=5733\n",
      "Epsilon=0.661993 Action_times=4176707 Epoche=5734\n",
      "Epsilon=0.661918 Action_times=4177854 Epoche=5735\n",
      "Epsilon=0.661866 Action_times=4178666 Epoche=5736\n",
      "Epsilon=0.661810 Action_times=4179519 Epoche=5737\n",
      "Epsilon=0.661773 Action_times=4180085 Epoche=5738\n",
      "Epsilon=0.661728 Action_times=4180772 Epoche=5739\n",
      "Epsilon=0.661637 Action_times=4182168 Epoche=5740\n",
      "Epsilon=0.661595 Action_times=4182818 Epoche=5741\n",
      "Epsilon=0.661571 Action_times=4183187 Epoche=5742\n",
      "Epsilon=0.661530 Action_times=4183817 Epoche=5743\n",
      "Epsilon=0.661479 Action_times=4184605 Epoche=5744\n",
      "Epsilon=0.661433 Action_times=4185307 Epoche=5745\n",
      "Epsilon=0.661362 Action_times=4186400 Epoche=5746\n",
      "Epsilon=0.661269 Action_times=4187819 Epoche=5747\n",
      "Epsilon=0.661242 Action_times=4188237 Epoche=5748\n",
      "Epsilon=0.661205 Action_times=4188800 Epoche=5749\n",
      "Epsilon=0.661189 Action_times=4189054 Epoche=5750\n",
      "Epsilon=0.661157 Action_times=4189536 Epoche=5751\n",
      "Epsilon=0.661049 Action_times=4191195 Epoche=5752\n",
      "Epsilon=0.661022 Action_times=4191614 Epoche=5753\n",
      "Epsilon=0.660924 Action_times=4193120 Epoche=5754\n",
      "Epsilon=0.660883 Action_times=4193752 Epoche=5755\n",
      "Epsilon=0.660734 Action_times=4196047 Epoche=5756\n",
      "Epsilon=0.660685 Action_times=4196787 Epoche=5757\n",
      "Epsilon=0.660618 Action_times=4197826 Epoche=5758\n",
      "Epsilon=0.660589 Action_times=4198273 Epoche=5759\n",
      "Epsilon=0.660583 Action_times=4198355 Epoche=5760\n",
      "Epsilon=0.660559 Action_times=4198731 Epoche=5761\n",
      "Epsilon=0.660518 Action_times=4199356 Epoche=5762\n",
      "Epsilon=0.660505 Action_times=4199561 Epoche=5763\n",
      "Epsilon=0.660491 Action_times=4199781 Epoche=5764\n",
      "Epsilon=0.660479 Action_times=4199956 Epoche=5765\n",
      "Epsilon=0.660432 Action_times=4200684 Epoche=5766\n",
      "Epsilon=0.660385 Action_times=4201407 Epoche=5767\n",
      "Epsilon=0.660317 Action_times=4202455 Epoche=5768\n",
      "Epsilon=0.660262 Action_times=4203301 Epoche=5769\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.660158 Action_times=4204900 Epoche=5770\n",
      "Epsilon=0.660142 Action_times=4205135 Epoche=5771\n",
      "Epsilon=0.660112 Action_times=4205602 Epoche=5772\n",
      "Epsilon=0.659979 Action_times=4207644 Epoche=5773\n",
      "Epsilon=0.659964 Action_times=4207881 Epoche=5774\n",
      "Epsilon=0.659900 Action_times=4208869 Epoche=5775\n",
      "Epsilon=0.659880 Action_times=4209176 Epoche=5776\n",
      "Epsilon=0.659851 Action_times=4209616 Epoche=5777\n",
      "Epsilon=0.659787 Action_times=4210609 Epoche=5778\n",
      "Epsilon=0.659758 Action_times=4211055 Epoche=5779\n",
      "Epsilon=0.659692 Action_times=4212067 Epoche=5780\n",
      "Epsilon=0.659656 Action_times=4212624 Epoche=5781\n",
      "Epsilon=0.659511 Action_times=4214847 Epoche=5782\n",
      "Epsilon=0.659376 Action_times=4216932 Epoche=5783\n",
      "Epsilon=0.659330 Action_times=4217644 Epoche=5784\n",
      "Epsilon=0.659303 Action_times=4218059 Epoche=5785\n",
      "Epsilon=0.659266 Action_times=4218626 Epoche=5786\n",
      "Epsilon=0.659194 Action_times=4219730 Epoche=5787\n",
      "Epsilon=0.659089 Action_times=4221352 Epoche=5788\n",
      "Epsilon=0.659023 Action_times=4222373 Epoche=5789\n",
      "Epsilon=0.658962 Action_times=4223306 Epoche=5790\n",
      "Epsilon=0.658902 Action_times=4224229 Epoche=5791\n",
      "Epsilon=0.658882 Action_times=4224537 Epoche=5792\n",
      "Epsilon=0.658765 Action_times=4226346 Epoche=5793\n",
      "Epsilon=0.658696 Action_times=4227401 Epoche=5794\n",
      "Epsilon=0.658635 Action_times=4228345 Epoche=5795\n",
      "Epsilon=0.658598 Action_times=4228921 Epoche=5796\n",
      "Epsilon=0.658582 Action_times=4229170 Epoche=5797\n",
      "Epsilon=0.658508 Action_times=4230303 Epoche=5798\n",
      "Epsilon=0.658372 Action_times=4232399 Epoche=5799\n",
      "Epsilon=0.658359 Action_times=4232597 Epoche=5800\n",
      "Epsilon=0.658340 Action_times=4232891 Epoche=5801\n",
      "Epsilon=0.658302 Action_times=4233478 Epoche=5802\n",
      "Epsilon=0.658254 Action_times=4234229 Epoche=5803\n",
      "Epsilon=0.658239 Action_times=4234458 Epoche=5804\n",
      "Epsilon=0.658186 Action_times=4235265 Epoche=5805\n",
      "Epsilon=0.658104 Action_times=4236544 Epoche=5806\n",
      "Epsilon=0.657976 Action_times=4238518 Epoche=5807\n",
      "Epsilon=0.657921 Action_times=4239369 Epoche=5808\n",
      "Epsilon=0.657897 Action_times=4239727 Epoche=5809\n",
      "Epsilon=0.657749 Action_times=4242009 Epoche=5810\n",
      "Epsilon=0.657631 Action_times=4243832 Epoche=5811\n",
      "Epsilon=0.657478 Action_times=4246196 Epoche=5812\n",
      "Epsilon=0.657371 Action_times=4247853 Epoche=5813\n",
      "Epsilon=0.657290 Action_times=4249110 Epoche=5814\n",
      "Epsilon=0.657212 Action_times=4250308 Epoche=5815\n",
      "Epsilon=0.657159 Action_times=4251123 Epoche=5816\n",
      "Epsilon=0.657122 Action_times=4251708 Epoche=5817\n",
      "Epsilon=0.656850 Action_times=4255899 Epoche=5818\n",
      "Epsilon=0.656739 Action_times=4257622 Epoche=5819\n",
      "Epsilon=0.656701 Action_times=4258213 Epoche=5820\n",
      "Epsilon=0.656520 Action_times=4261003 Epoche=5821\n",
      "Epsilon=0.656487 Action_times=4261521 Epoche=5822\n",
      "Epsilon=0.656392 Action_times=4262987 Epoche=5823\n",
      "Epsilon=0.656380 Action_times=4263180 Epoche=5824\n",
      "Epsilon=0.656314 Action_times=4264191 Epoche=5825\n",
      "Epsilon=0.656234 Action_times=4265440 Epoche=5826\n",
      "Epsilon=0.656166 Action_times=4266485 Epoche=5827\n",
      "Epsilon=0.656097 Action_times=4267554 Epoche=5828\n",
      "Epsilon=0.656030 Action_times=4268589 Epoche=5829\n",
      "Epsilon=0.656013 Action_times=4268851 Epoche=5830\n",
      "Epsilon=0.655868 Action_times=4271092 Epoche=5831\n",
      "Epsilon=0.655784 Action_times=4272398 Epoche=5832\n",
      "Epsilon=0.655722 Action_times=4273361 Epoche=5833\n",
      "Epsilon=0.655688 Action_times=4273891 Epoche=5834\n",
      "Epsilon=0.655651 Action_times=4274454 Epoche=5835\n",
      "Epsilon=0.655547 Action_times=4276067 Epoche=5836\n",
      "Epsilon=0.655507 Action_times=4276692 Epoche=5837\n",
      "Epsilon=0.655431 Action_times=4277860 Epoche=5838\n",
      "Epsilon=0.655404 Action_times=4278281 Epoche=5839\n",
      "Epsilon=0.655339 Action_times=4279299 Epoche=5840\n",
      "Epsilon=0.655301 Action_times=4279886 Epoche=5841\n",
      "Epsilon=0.655267 Action_times=4280406 Epoche=5842\n",
      "Epsilon=0.655260 Action_times=4280519 Epoche=5843\n",
      "Epsilon=0.655216 Action_times=4281199 Epoche=5844\n",
      "Epsilon=0.655192 Action_times=4281563 Epoche=5845\n",
      "Epsilon=0.655122 Action_times=4282660 Epoche=5846\n",
      "Epsilon=0.655069 Action_times=4283480 Epoche=5847\n",
      "Epsilon=0.654932 Action_times=4285607 Epoche=5848\n",
      "Epsilon=0.654808 Action_times=4287524 Epoche=5849\n",
      "Epsilon=0.654759 Action_times=4288288 Epoche=5850\n",
      "Epsilon=0.654711 Action_times=4289021 Epoche=5851\n",
      "Epsilon=0.654681 Action_times=4289491 Epoche=5852\n",
      "Epsilon=0.654636 Action_times=4290185 Epoche=5853\n",
      "Epsilon=0.654566 Action_times=4291275 Epoche=5854\n",
      "Epsilon=0.654531 Action_times=4291821 Epoche=5855\n",
      "Epsilon=0.654492 Action_times=4292433 Epoche=5856\n",
      "Epsilon=0.654415 Action_times=4293627 Epoche=5857\n",
      "Epsilon=0.654323 Action_times=4295042 Epoche=5858\n",
      "Epsilon=0.654255 Action_times=4296103 Epoche=5859\n",
      "Epsilon=0.654190 Action_times=4297111 Epoche=5860\n",
      "Epsilon=0.654123 Action_times=4298145 Epoche=5861\n",
      "Epsilon=0.653995 Action_times=4300134 Epoche=5862\n",
      "Epsilon=0.653945 Action_times=4300923 Epoche=5863\n",
      "Epsilon=0.653778 Action_times=4303511 Epoche=5864\n",
      "Epsilon=0.653632 Action_times=4305778 Epoche=5865\n",
      "Epsilon=0.653588 Action_times=4306459 Epoche=5866\n",
      "Epsilon=0.653482 Action_times=4308108 Epoche=5867\n",
      "Epsilon=0.653394 Action_times=4309481 Epoche=5868\n",
      "Epsilon=0.653356 Action_times=4310060 Epoche=5869\n",
      "Epsilon=0.653307 Action_times=4310828 Epoche=5870\n",
      "Epsilon=0.653216 Action_times=4312243 Epoche=5871\n",
      "Epsilon=0.653136 Action_times=4313491 Epoche=5872\n",
      "Epsilon=0.653079 Action_times=4314368 Epoche=5873\n",
      "Epsilon=0.652963 Action_times=4316172 Epoche=5874\n",
      "Epsilon=0.652900 Action_times=4317160 Epoche=5875\n",
      "Epsilon=0.652827 Action_times=4318292 Epoche=5876\n",
      "Epsilon=0.652734 Action_times=4319746 Epoche=5877\n",
      "Epsilon=0.652658 Action_times=4320927 Epoche=5878\n",
      "Epsilon=0.652621 Action_times=4321499 Epoche=5879\n",
      "Epsilon=0.652530 Action_times=4322918 Epoche=5880\n",
      "Epsilon=0.652435 Action_times=4324386 Epoche=5881\n",
      "Epsilon=0.652375 Action_times=4325333 Epoche=5882\n",
      "Epsilon=0.652337 Action_times=4325920 Epoche=5883\n",
      "Epsilon=0.652247 Action_times=4327323 Epoche=5884\n",
      "Epsilon=0.652191 Action_times=4328194 Epoche=5885\n",
      "Epsilon=0.652138 Action_times=4329021 Epoche=5886\n",
      "Epsilon=0.652114 Action_times=4329398 Epoche=5887\n",
      "Epsilon=0.652020 Action_times=4330852 Epoche=5888\n",
      "Epsilon=0.651982 Action_times=4331447 Epoche=5889\n",
      "Epsilon=0.651942 Action_times=4332070 Epoche=5890\n",
      "Epsilon=0.651897 Action_times=4332774 Epoche=5891\n",
      "Epsilon=0.651818 Action_times=4333995 Epoche=5892\n",
      "Epsilon=0.651765 Action_times=4334820 Epoche=5893\n",
      "Epsilon=0.651686 Action_times=4336059 Epoche=5894\n",
      "Epsilon=0.651657 Action_times=4336518 Epoche=5895\n",
      "Epsilon=0.651625 Action_times=4337016 Epoche=5896\n",
      "Epsilon=0.651602 Action_times=4337360 Epoche=5897\n",
      "Epsilon=0.651592 Action_times=4337519 Epoche=5898\n",
      "Epsilon=0.651536 Action_times=4338401 Epoche=5899\n",
      "Epsilon=0.651501 Action_times=4338938 Epoche=5900\n",
      "Epsilon=0.651398 Action_times=4340541 Epoche=5901\n",
      "Epsilon=0.651326 Action_times=4341674 Epoche=5902\n",
      "Epsilon=0.651293 Action_times=4342192 Epoche=5903\n",
      "Epsilon=0.651213 Action_times=4343433 Epoche=5904\n",
      "Epsilon=0.651141 Action_times=4344549 Epoche=5905\n",
      "Epsilon=0.651115 Action_times=4344968 Epoche=5906\n",
      "Epsilon=0.651087 Action_times=4345402 Epoche=5907\n",
      "Epsilon=0.651041 Action_times=4346114 Epoche=5908\n",
      "Epsilon=0.650981 Action_times=4347045 Epoche=5909\n",
      "Epsilon=0.650857 Action_times=4348979 Epoche=5910\n",
      "Epsilon=0.650792 Action_times=4349998 Epoche=5911\n",
      "Epsilon=0.650677 Action_times=4351791 Epoche=5912\n",
      "Epsilon=0.650609 Action_times=4352852 Epoche=5913\n",
      "Epsilon=0.650559 Action_times=4353639 Epoche=5914\n",
      "Epsilon=0.650518 Action_times=4354283 Epoche=5915\n",
      "Epsilon=0.650379 Action_times=4356445 Epoche=5916\n",
      "Epsilon=0.650314 Action_times=4357455 Epoche=5917\n",
      "Epsilon=0.650200 Action_times=4359247 Epoche=5918\n",
      "Epsilon=0.650191 Action_times=4359384 Epoche=5919\n",
      "Epsilon=0.650164 Action_times=4359811 Epoche=5920\n",
      "Epsilon=0.650105 Action_times=4360730 Epoche=5921\n",
      "Epsilon=0.650043 Action_times=4361691 Epoche=5922\n",
      "Epsilon=0.650026 Action_times=4361965 Epoche=5923\n",
      "Epsilon=0.649936 Action_times=4363371 Epoche=5924\n",
      "Epsilon=0.649870 Action_times=4364394 Epoche=5925\n",
      "Epsilon=0.649760 Action_times=4366126 Epoche=5926\n",
      "Epsilon=0.649727 Action_times=4366631 Epoche=5927\n",
      "Epsilon=0.649586 Action_times=4368833 Epoche=5928\n",
      "Epsilon=0.649522 Action_times=4369833 Epoche=5929\n",
      "Epsilon=0.649433 Action_times=4371232 Epoche=5930\n",
      "Epsilon=0.649396 Action_times=4371816 Epoche=5931\n",
      "Epsilon=0.649283 Action_times=4373574 Epoche=5932\n",
      "Epsilon=0.649124 Action_times=4376072 Epoche=5933\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.649007 Action_times=4377890 Epoche=5934\n",
      "Epsilon=0.648930 Action_times=4379102 Epoche=5935\n",
      "Epsilon=0.648805 Action_times=4381055 Epoche=5936\n",
      "Epsilon=0.648759 Action_times=4381777 Epoche=5937\n",
      "Epsilon=0.648600 Action_times=4384259 Epoche=5938\n",
      "Epsilon=0.648556 Action_times=4384960 Epoche=5939\n",
      "Epsilon=0.648527 Action_times=4385411 Epoche=5940\n",
      "Epsilon=0.648519 Action_times=4385541 Epoche=5941\n",
      "Epsilon=0.648487 Action_times=4386041 Epoche=5942\n",
      "Epsilon=0.648427 Action_times=4386973 Epoche=5943\n",
      "Epsilon=0.648389 Action_times=4387578 Epoche=5944\n",
      "Epsilon=0.648369 Action_times=4387885 Epoche=5945\n",
      "Epsilon=0.648345 Action_times=4388256 Epoche=5946\n",
      "Epsilon=0.648321 Action_times=4388630 Epoche=5947\n",
      "Epsilon=0.648302 Action_times=4388938 Epoche=5948\n",
      "Epsilon=0.648252 Action_times=4389713 Epoche=5949\n",
      "Epsilon=0.648222 Action_times=4390187 Epoche=5950\n",
      "Epsilon=0.648203 Action_times=4390478 Epoche=5951\n",
      "Epsilon=0.648160 Action_times=4391156 Epoche=5952\n",
      "Epsilon=0.648085 Action_times=4392333 Epoche=5953\n",
      "Epsilon=0.648049 Action_times=4392897 Epoche=5954\n",
      "Epsilon=0.648004 Action_times=4393601 Epoche=5955\n",
      "Epsilon=0.647862 Action_times=4395831 Epoche=5956\n",
      "Epsilon=0.647830 Action_times=4396328 Epoche=5957\n",
      "Epsilon=0.647757 Action_times=4397473 Epoche=5958\n",
      "Epsilon=0.647714 Action_times=4398152 Epoche=5959\n",
      "Epsilon=0.647619 Action_times=4399642 Epoche=5960\n",
      "Epsilon=0.647529 Action_times=4401044 Epoche=5961\n",
      "Epsilon=0.647449 Action_times=4402310 Epoche=5962\n",
      "Epsilon=0.647341 Action_times=4404007 Epoche=5963\n",
      "Epsilon=0.647239 Action_times=4405597 Epoche=5964\n",
      "Epsilon=0.647137 Action_times=4407200 Epoche=5965\n",
      "Epsilon=0.647013 Action_times=4409151 Epoche=5966\n",
      "Epsilon=0.646937 Action_times=4410339 Epoche=5967\n",
      "Epsilon=0.646807 Action_times=4412390 Epoche=5968\n",
      "Epsilon=0.646775 Action_times=4412889 Epoche=5969\n",
      "Epsilon=0.646711 Action_times=4413886 Epoche=5970\n",
      "Epsilon=0.646562 Action_times=4416228 Epoche=5971\n",
      "Epsilon=0.646477 Action_times=4417566 Epoche=5972\n",
      "Epsilon=0.646348 Action_times=4419587 Epoche=5973\n",
      "Epsilon=0.646270 Action_times=4420824 Epoche=5974\n",
      "Epsilon=0.646185 Action_times=4422150 Epoche=5975\n",
      "Epsilon=0.646108 Action_times=4423364 Epoche=5976\n",
      "Epsilon=0.645959 Action_times=4425713 Epoche=5977\n",
      "Epsilon=0.645911 Action_times=4426468 Epoche=5978\n",
      "Epsilon=0.645838 Action_times=4427613 Epoche=5979\n",
      "Epsilon=0.645774 Action_times=4428623 Epoche=5980\n",
      "Epsilon=0.645560 Action_times=4431986 Epoche=5981\n",
      "Epsilon=0.645514 Action_times=4432705 Epoche=5982\n",
      "Epsilon=0.645396 Action_times=4434560 Epoche=5983\n",
      "Epsilon=0.645366 Action_times=4435035 Epoche=5984\n",
      "Epsilon=0.645210 Action_times=4437489 Epoche=5985\n",
      "Epsilon=0.645160 Action_times=4438275 Epoche=5986\n",
      "Epsilon=0.645072 Action_times=4439663 Epoche=5987\n",
      "Epsilon=0.645040 Action_times=4440169 Epoche=5988\n",
      "Epsilon=0.644987 Action_times=4441002 Epoche=5989\n",
      "Epsilon=0.644940 Action_times=4441749 Epoche=5990\n",
      "Epsilon=0.644873 Action_times=4442802 Epoche=5991\n",
      "Epsilon=0.644845 Action_times=4443234 Epoche=5992\n",
      "Epsilon=0.644801 Action_times=4443933 Epoche=5993\n",
      "Epsilon=0.644747 Action_times=4444783 Epoche=5994\n",
      "Epsilon=0.644715 Action_times=4445291 Epoche=5995\n",
      "Epsilon=0.644625 Action_times=4446709 Epoche=5996\n",
      "Epsilon=0.644619 Action_times=4446798 Epoche=5997\n",
      "Epsilon=0.644580 Action_times=4447412 Epoche=5998\n",
      "Epsilon=0.644531 Action_times=4448184 Epoche=5999\n",
      "2\n",
      "***********************************************************\n",
      "Succeed to initialize Q-Table!\n",
      "***********************************************************\n",
      "Epsilon=0.997172 Action_times=28609 Epoche=6000\n",
      "Epsilon=0.995843 Action_times=42080 Epoche=6001\n",
      "Epsilon=0.993788 Action_times=62942 Epoche=6002\n",
      "Epsilon=0.992590 Action_times=75133 Epoche=6003\n",
      "Epsilon=0.989628 Action_times=105323 Epoche=6004\n",
      "Epsilon=0.987654 Action_times=125491 Epoche=6005\n",
      "Epsilon=0.986366 Action_times=138672 Epoche=6006\n",
      "Epsilon=0.982830 Action_times=174953 Epoche=6007\n",
      "Epsilon=0.982146 Action_times=181991 Epoche=6008\n",
      "Epsilon=0.981278 Action_times=190927 Epoche=6009\n",
      "Epsilon=0.980578 Action_times=198132 Epoche=6010\n",
      "Epsilon=0.978907 Action_times=215368 Epoche=6011\n",
      "Epsilon=0.977122 Action_times=233805 Epoche=6012\n",
      "Epsilon=0.976607 Action_times=239133 Epoche=6013\n",
      "Epsilon=0.976009 Action_times=245318 Epoche=6014\n",
      "Epsilon=0.975053 Action_times=255222 Epoche=6015\n",
      "Epsilon=0.974589 Action_times=260032 Epoche=6016\n",
      "Epsilon=0.973803 Action_times=268181 Epoche=6017\n",
      "Epsilon=0.972979 Action_times=276733 Epoche=6018\n",
      "Epsilon=0.972233 Action_times=284483 Epoche=6019\n",
      "Epsilon=0.971946 Action_times=287471 Epoche=6020\n",
      "Epsilon=0.971621 Action_times=290849 Epoche=6021\n",
      "Epsilon=0.970643 Action_times=301017 Epoche=6022\n",
      "Epsilon=0.970266 Action_times=304945 Epoche=6023\n",
      "Epsilon=0.970100 Action_times=306680 Epoche=6024\n",
      "Epsilon=0.969398 Action_times=313994 Epoche=6025\n",
      "Epsilon=0.969103 Action_times=317061 Epoche=6026\n",
      "Epsilon=0.968877 Action_times=319426 Epoche=6027\n",
      "Epsilon=0.968275 Action_times=325698 Epoche=6028\n",
      "Epsilon=0.967433 Action_times=334493 Epoche=6029\n",
      "Epsilon=0.967117 Action_times=337794 Epoche=6030\n",
      "Epsilon=0.966982 Action_times=339208 Epoche=6031\n",
      "Epsilon=0.966603 Action_times=343165 Epoche=6032\n",
      "Epsilon=0.966563 Action_times=343588 Epoche=6033\n",
      "Epsilon=0.965882 Action_times=350707 Epoche=6034\n",
      "Epsilon=0.965606 Action_times=353592 Epoche=6035\n",
      "Epsilon=0.965332 Action_times=356458 Epoche=6036\n",
      "Epsilon=0.964661 Action_times=363486 Epoche=6037\n",
      "Epsilon=0.963692 Action_times=373646 Epoche=6038\n",
      "Epsilon=0.963061 Action_times=380261 Epoche=6039\n",
      "Epsilon=0.962497 Action_times=386175 Epoche=6040\n",
      "Epsilon=0.962248 Action_times=388796 Epoche=6041\n",
      "Epsilon=0.961622 Action_times=395368 Epoche=6042\n",
      "Epsilon=0.961242 Action_times=399365 Epoche=6043\n",
      "Epsilon=0.961060 Action_times=401277 Epoche=6044\n",
      "Epsilon=0.960847 Action_times=403514 Epoche=6045\n",
      "Epsilon=0.960498 Action_times=407190 Epoche=6046\n",
      "Epsilon=0.959718 Action_times=415399 Epoche=6047\n",
      "Epsilon=0.959593 Action_times=416714 Epoche=6048\n",
      "Epsilon=0.959324 Action_times=419553 Epoche=6049\n",
      "Epsilon=0.958851 Action_times=424532 Epoche=6050\n",
      "Epsilon=0.958598 Action_times=427197 Epoche=6051\n",
      "Epsilon=0.958361 Action_times=429699 Epoche=6052\n",
      "Epsilon=0.957767 Action_times=435964 Epoche=6053\n",
      "Epsilon=0.957583 Action_times=437908 Epoche=6054\n",
      "Epsilon=0.956878 Action_times=445347 Epoche=6055\n",
      "Epsilon=0.956642 Action_times=447841 Epoche=6056\n",
      "Epsilon=0.956440 Action_times=449974 Epoche=6057\n",
      "Epsilon=0.955723 Action_times=457548 Epoche=6058\n",
      "Epsilon=0.955618 Action_times=458666 Epoche=6059\n",
      "Epsilon=0.955125 Action_times=463873 Epoche=6060\n",
      "Epsilon=0.954954 Action_times=465689 Epoche=6061\n",
      "Epsilon=0.954633 Action_times=469083 Epoche=6062\n",
      "Epsilon=0.954053 Action_times=475227 Epoche=6063\n",
      "Epsilon=0.953646 Action_times=479536 Epoche=6064\n",
      "Epsilon=0.953236 Action_times=483883 Epoche=6065\n",
      "Epsilon=0.953163 Action_times=484653 Epoche=6066\n",
      "Epsilon=0.952922 Action_times=487211 Epoche=6067\n",
      "Epsilon=0.952577 Action_times=490876 Epoche=6068\n",
      "Epsilon=0.952420 Action_times=492540 Epoche=6069\n",
      "Epsilon=0.951772 Action_times=499419 Epoche=6070\n",
      "Epsilon=0.951567 Action_times=501596 Epoche=6071\n",
      "Epsilon=0.951211 Action_times=505371 Epoche=6072\n",
      "Epsilon=0.951101 Action_times=506543 Epoche=6073\n",
      "Epsilon=0.950931 Action_times=508347 Epoche=6074\n",
      "Epsilon=0.950456 Action_times=513400 Epoche=6075\n",
      "Epsilon=0.950349 Action_times=514540 Epoche=6076\n",
      "Epsilon=0.950082 Action_times=517382 Epoche=6077\n",
      "Epsilon=0.949749 Action_times=520917 Epoche=6078\n",
      "Epsilon=0.949660 Action_times=521870 Epoche=6079\n",
      "Epsilon=0.949463 Action_times=523967 Epoche=6080\n",
      "Epsilon=0.949258 Action_times=526144 Epoche=6081\n",
      "Epsilon=0.949110 Action_times=527719 Epoche=6082\n",
      "Epsilon=0.948741 Action_times=531651 Epoche=6083\n",
      "Epsilon=0.948391 Action_times=535381 Epoche=6084\n",
      "Epsilon=0.948290 Action_times=536458 Epoche=6085\n",
      "Epsilon=0.948149 Action_times=537964 Epoche=6086\n",
      "Epsilon=0.947988 Action_times=539677 Epoche=6087\n",
      "Epsilon=0.947608 Action_times=543725 Epoche=6088\n",
      "Epsilon=0.947550 Action_times=544352 Epoche=6089\n",
      "Epsilon=0.946896 Action_times=551323 Epoche=6090\n",
      "Epsilon=0.946735 Action_times=553041 Epoche=6091\n",
      "Epsilon=0.946479 Action_times=555777 Epoche=6092\n",
      "Epsilon=0.946301 Action_times=557680 Epoche=6093\n",
      "Epsilon=0.946070 Action_times=560150 Epoche=6094\n",
      "Epsilon=0.945270 Action_times=568698 Epoche=6095\n",
      "Epsilon=0.944855 Action_times=573139 Epoche=6096\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.944649 Action_times=575335 Epoche=6097\n",
      "Epsilon=0.944440 Action_times=577575 Epoche=6098\n",
      "Epsilon=0.944222 Action_times=579913 Epoche=6099\n",
      "Epsilon=0.944012 Action_times=582161 Epoche=6100\n",
      "Epsilon=0.943562 Action_times=586974 Epoche=6101\n",
      "Epsilon=0.943473 Action_times=587933 Epoche=6102\n",
      "Epsilon=0.942855 Action_times=594551 Epoche=6103\n",
      "Epsilon=0.942527 Action_times=598073 Epoche=6104\n",
      "Epsilon=0.941934 Action_times=604432 Epoche=6105\n",
      "Epsilon=0.941727 Action_times=606652 Epoche=6106\n",
      "Epsilon=0.941604 Action_times=607968 Epoche=6107\n",
      "Epsilon=0.941131 Action_times=613046 Epoche=6108\n",
      "Epsilon=0.940751 Action_times=617127 Epoche=6109\n",
      "Epsilon=0.940440 Action_times=620471 Epoche=6110\n",
      "Epsilon=0.940061 Action_times=624544 Epoche=6111\n",
      "Epsilon=0.939909 Action_times=626187 Epoche=6112\n",
      "Epsilon=0.939893 Action_times=626356 Epoche=6113\n",
      "Epsilon=0.939355 Action_times=632144 Epoche=6114\n",
      "Epsilon=0.939060 Action_times=635315 Epoche=6115\n",
      "Epsilon=0.938715 Action_times=639030 Epoche=6116\n",
      "Epsilon=0.938549 Action_times=640822 Epoche=6117\n",
      "Epsilon=0.938040 Action_times=646306 Epoche=6118\n",
      "Epsilon=0.937915 Action_times=647651 Epoche=6119\n",
      "Epsilon=0.937784 Action_times=649055 Epoche=6120\n",
      "Epsilon=0.937707 Action_times=649886 Epoche=6121\n",
      "Epsilon=0.937272 Action_times=654585 Epoche=6122\n",
      "Epsilon=0.937141 Action_times=655995 Epoche=6123\n",
      "Epsilon=0.936915 Action_times=658426 Epoche=6124\n",
      "Epsilon=0.936679 Action_times=660981 Epoche=6125\n",
      "Epsilon=0.936396 Action_times=664032 Epoche=6126\n",
      "Epsilon=0.936244 Action_times=665674 Epoche=6127\n",
      "Epsilon=0.936037 Action_times=667906 Epoche=6128\n",
      "Epsilon=0.935871 Action_times=669697 Epoche=6129\n",
      "Epsilon=0.935397 Action_times=674821 Epoche=6130\n",
      "Epsilon=0.935285 Action_times=676028 Epoche=6131\n",
      "Epsilon=0.934822 Action_times=681035 Epoche=6132\n",
      "Epsilon=0.934628 Action_times=683139 Epoche=6133\n",
      "Epsilon=0.934568 Action_times=683787 Epoche=6134\n",
      "Epsilon=0.934266 Action_times=687045 Epoche=6135\n",
      "Epsilon=0.933978 Action_times=690169 Epoche=6136\n",
      "Epsilon=0.933706 Action_times=693107 Epoche=6137\n",
      "Epsilon=0.933631 Action_times=693918 Epoche=6138\n",
      "Epsilon=0.933498 Action_times=695368 Epoche=6139\n",
      "Epsilon=0.933080 Action_times=699888 Epoche=6140\n",
      "Epsilon=0.932520 Action_times=705955 Epoche=6141\n",
      "Epsilon=0.932388 Action_times=707394 Epoche=6142\n",
      "Epsilon=0.931876 Action_times=712937 Epoche=6143\n",
      "Epsilon=0.931282 Action_times=719385 Epoche=6144\n",
      "Epsilon=0.931123 Action_times=721117 Epoche=6145\n",
      "Epsilon=0.930817 Action_times=724436 Epoche=6146\n",
      "Epsilon=0.930588 Action_times=726924 Epoche=6147\n",
      "Epsilon=0.930532 Action_times=727537 Epoche=6148\n",
      "Epsilon=0.930112 Action_times=732092 Epoche=6149\n",
      "Epsilon=0.929755 Action_times=735973 Epoche=6150\n",
      "Epsilon=0.929671 Action_times=736885 Epoche=6151\n",
      "Epsilon=0.929424 Action_times=739574 Epoche=6152\n",
      "Epsilon=0.929166 Action_times=742378 Epoche=6153\n",
      "Epsilon=0.928665 Action_times=747832 Epoche=6154\n",
      "Epsilon=0.928352 Action_times=751245 Epoche=6155\n",
      "Epsilon=0.928187 Action_times=753037 Epoche=6156\n",
      "Epsilon=0.928107 Action_times=753912 Epoche=6157\n",
      "Epsilon=0.927843 Action_times=756785 Epoche=6158\n",
      "Epsilon=0.927428 Action_times=761313 Epoche=6159\n",
      "Epsilon=0.927221 Action_times=763565 Epoche=6160\n",
      "Epsilon=0.926991 Action_times=766077 Epoche=6161\n",
      "Epsilon=0.926884 Action_times=767239 Epoche=6162\n",
      "Epsilon=0.926335 Action_times=773224 Epoche=6163\n",
      "Epsilon=0.926156 Action_times=775178 Epoche=6164\n",
      "Epsilon=0.925827 Action_times=778779 Epoche=6165\n",
      "Epsilon=0.925568 Action_times=781600 Epoche=6166\n",
      "Epsilon=0.925048 Action_times=787283 Epoche=6167\n",
      "Epsilon=0.924768 Action_times=790350 Epoche=6168\n",
      "Epsilon=0.924638 Action_times=791768 Epoche=6169\n",
      "Epsilon=0.924540 Action_times=792840 Epoche=6170\n",
      "Epsilon=0.924410 Action_times=794256 Epoche=6171\n",
      "Epsilon=0.924308 Action_times=795379 Epoche=6172\n",
      "Epsilon=0.923278 Action_times=806649 Epoche=6173\n",
      "Epsilon=0.922833 Action_times=811515 Epoche=6174\n",
      "Epsilon=0.922430 Action_times=815933 Epoche=6175\n",
      "Epsilon=0.922043 Action_times=820177 Epoche=6176\n",
      "Epsilon=0.921902 Action_times=821729 Epoche=6177\n",
      "Epsilon=0.921498 Action_times=826152 Epoche=6178\n",
      "Epsilon=0.921250 Action_times=828879 Epoche=6179\n",
      "Epsilon=0.921023 Action_times=831366 Epoche=6180\n",
      "Epsilon=0.920842 Action_times=833352 Epoche=6181\n",
      "Epsilon=0.920708 Action_times=834829 Epoche=6182\n",
      "Epsilon=0.920513 Action_times=836965 Epoche=6183\n",
      "Epsilon=0.920206 Action_times=840339 Epoche=6184\n",
      "Epsilon=0.919807 Action_times=844721 Epoche=6185\n",
      "Epsilon=0.919708 Action_times=845814 Epoche=6186\n",
      "Epsilon=0.919671 Action_times=846219 Epoche=6187\n",
      "Epsilon=0.919625 Action_times=846720 Epoche=6188\n",
      "Epsilon=0.919485 Action_times=848266 Epoche=6189\n",
      "Epsilon=0.919282 Action_times=850494 Epoche=6190\n",
      "Epsilon=0.919028 Action_times=853287 Epoche=6191\n",
      "Epsilon=0.918735 Action_times=856511 Epoche=6192\n",
      "Epsilon=0.918439 Action_times=859776 Epoche=6193\n",
      "Epsilon=0.918283 Action_times=861486 Epoche=6194\n",
      "Epsilon=0.918087 Action_times=863649 Epoche=6195\n",
      "Epsilon=0.917887 Action_times=865853 Epoche=6196\n",
      "Epsilon=0.917656 Action_times=868393 Epoche=6197\n",
      "Epsilon=0.917483 Action_times=870306 Epoche=6198\n",
      "Epsilon=0.917394 Action_times=871286 Epoche=6199\n",
      "Epsilon=0.917218 Action_times=873225 Epoche=6200\n",
      "Epsilon=0.917178 Action_times=873668 Epoche=6201\n",
      "Epsilon=0.917006 Action_times=875554 Epoche=6202\n",
      "Epsilon=0.916870 Action_times=877055 Epoche=6203\n",
      "Epsilon=0.916600 Action_times=880039 Epoche=6204\n",
      "Epsilon=0.916437 Action_times=881834 Epoche=6205\n",
      "Epsilon=0.916256 Action_times=883831 Epoche=6206\n",
      "Epsilon=0.916208 Action_times=884363 Epoche=6207\n",
      "Epsilon=0.915796 Action_times=888909 Epoche=6208\n",
      "Epsilon=0.915709 Action_times=889867 Epoche=6209\n",
      "Epsilon=0.915481 Action_times=892382 Epoche=6210\n",
      "Epsilon=0.915227 Action_times=895193 Epoche=6211\n",
      "Epsilon=0.915021 Action_times=897471 Epoche=6212\n",
      "Epsilon=0.914860 Action_times=899245 Epoche=6213\n",
      "Epsilon=0.914776 Action_times=900177 Epoche=6214\n",
      "Epsilon=0.914606 Action_times=902060 Epoche=6215\n",
      "Epsilon=0.914502 Action_times=903202 Epoche=6216\n",
      "Epsilon=0.914375 Action_times=904610 Epoche=6217\n",
      "Epsilon=0.914295 Action_times=905491 Epoche=6218\n",
      "Epsilon=0.913985 Action_times=908924 Epoche=6219\n",
      "Epsilon=0.913788 Action_times=911099 Epoche=6220\n",
      "Epsilon=0.913773 Action_times=911268 Epoche=6221\n",
      "Epsilon=0.913664 Action_times=912475 Epoche=6222\n",
      "Epsilon=0.913579 Action_times=913414 Epoche=6223\n",
      "Epsilon=0.913334 Action_times=916127 Epoche=6224\n",
      "Epsilon=0.913211 Action_times=917491 Epoche=6225\n",
      "Epsilon=0.912983 Action_times=920016 Epoche=6226\n",
      "Epsilon=0.912871 Action_times=921252 Epoche=6227\n",
      "Epsilon=0.912676 Action_times=923410 Epoche=6228\n",
      "Epsilon=0.912550 Action_times=924804 Epoche=6229\n",
      "Epsilon=0.912310 Action_times=927463 Epoche=6230\n",
      "Epsilon=0.912173 Action_times=928988 Epoche=6231\n",
      "Epsilon=0.911927 Action_times=931711 Epoche=6232\n",
      "Epsilon=0.911769 Action_times=933463 Epoche=6233\n",
      "Epsilon=0.911376 Action_times=937830 Epoche=6234\n",
      "Epsilon=0.910895 Action_times=943160 Epoche=6235\n",
      "Epsilon=0.910834 Action_times=943841 Epoche=6236\n",
      "Epsilon=0.910589 Action_times=946564 Epoche=6237\n",
      "Epsilon=0.910533 Action_times=947179 Epoche=6238\n",
      "Epsilon=0.910406 Action_times=948593 Epoche=6239\n",
      "Epsilon=0.910130 Action_times=951653 Epoche=6240\n",
      "Epsilon=0.909961 Action_times=953534 Epoche=6241\n",
      "Epsilon=0.909658 Action_times=956907 Epoche=6242\n",
      "Epsilon=0.909383 Action_times=959961 Epoche=6243\n",
      "Epsilon=0.909155 Action_times=962497 Epoche=6244\n",
      "Epsilon=0.908958 Action_times=964685 Epoche=6245\n",
      "Epsilon=0.908801 Action_times=966437 Epoche=6246\n",
      "Epsilon=0.908484 Action_times=969964 Epoche=6247\n",
      "Epsilon=0.908195 Action_times=973180 Epoche=6248\n",
      "Epsilon=0.907870 Action_times=976795 Epoche=6249\n",
      "Epsilon=0.907796 Action_times=977616 Epoche=6250\n",
      "Epsilon=0.907702 Action_times=978663 Epoche=6251\n",
      "Epsilon=0.907592 Action_times=979890 Epoche=6252\n",
      "Epsilon=0.907490 Action_times=981032 Epoche=6253\n",
      "Epsilon=0.907287 Action_times=983295 Epoche=6254\n",
      "Epsilon=0.907183 Action_times=984454 Epoche=6255\n",
      "Epsilon=0.907057 Action_times=985859 Epoche=6256\n",
      "Epsilon=0.906814 Action_times=988570 Epoche=6257\n",
      "Epsilon=0.906680 Action_times=990063 Epoche=6258\n",
      "Epsilon=0.906507 Action_times=991987 Epoche=6259\n",
      "Epsilon=0.906477 Action_times=992328 Epoche=6260\n",
      "Epsilon=0.906309 Action_times=994195 Epoche=6261\n",
      "Epsilon=0.906169 Action_times=995760 Epoche=6262\n",
      "Epsilon=0.906077 Action_times=996781 Epoche=6263\n",
      "Epsilon=0.905952 Action_times=998181 Epoche=6264\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.905703 Action_times=1000958 Epoche=6265\n",
      "Epsilon=0.905491 Action_times=1003330 Epoche=6266\n",
      "Epsilon=0.905432 Action_times=1003985 Epoche=6267\n",
      "Epsilon=0.905222 Action_times=1006337 Epoche=6268\n",
      "Epsilon=0.904988 Action_times=1008941 Epoche=6269\n",
      "Epsilon=0.904824 Action_times=1010776 Epoche=6270\n",
      "Epsilon=0.904672 Action_times=1012480 Epoche=6271\n",
      "Epsilon=0.904554 Action_times=1013794 Epoche=6272\n",
      "Epsilon=0.904441 Action_times=1015059 Epoche=6273\n",
      "Epsilon=0.904366 Action_times=1015895 Epoche=6274\n",
      "Epsilon=0.904161 Action_times=1018191 Epoche=6275\n",
      "Epsilon=0.904035 Action_times=1019598 Epoche=6276\n",
      "Epsilon=0.903922 Action_times=1020859 Epoche=6277\n",
      "Epsilon=0.903432 Action_times=1026346 Epoche=6278\n",
      "Epsilon=0.903133 Action_times=1029692 Epoche=6279\n",
      "Epsilon=0.902898 Action_times=1032325 Epoche=6280\n",
      "Epsilon=0.902682 Action_times=1034750 Epoche=6281\n",
      "Epsilon=0.902651 Action_times=1035090 Epoche=6282\n",
      "Epsilon=0.902616 Action_times=1035485 Epoche=6283\n",
      "Epsilon=0.902437 Action_times=1037488 Epoche=6284\n",
      "Epsilon=0.902281 Action_times=1039241 Epoche=6285\n",
      "Epsilon=0.902116 Action_times=1041084 Epoche=6286\n",
      "Epsilon=0.902055 Action_times=1041771 Epoche=6287\n",
      "Epsilon=0.901857 Action_times=1043989 Epoche=6288\n",
      "Epsilon=0.901442 Action_times=1048648 Epoche=6289\n",
      "Epsilon=0.901147 Action_times=1051954 Epoche=6290\n",
      "Epsilon=0.901061 Action_times=1052923 Epoche=6291\n",
      "Epsilon=0.900756 Action_times=1056346 Epoche=6292\n",
      "Epsilon=0.900475 Action_times=1059500 Epoche=6293\n",
      "Epsilon=0.900379 Action_times=1060573 Epoche=6294\n",
      "Epsilon=0.900345 Action_times=1060957 Epoche=6295\n",
      "Epsilon=0.900262 Action_times=1061894 Epoche=6296\n",
      "Epsilon=0.900236 Action_times=1062184 Epoche=6297\n",
      "Epsilon=0.900138 Action_times=1063280 Epoche=6298\n",
      "Epsilon=0.900078 Action_times=1063954 Epoche=6299\n",
      "Epsilon=0.900039 Action_times=1064399 Epoche=6300\n",
      "Epsilon=0.899999 Action_times=1064849 Epoche=6301\n",
      "Epsilon=0.899834 Action_times=1066702 Epoche=6302\n",
      "Epsilon=0.899617 Action_times=1069137 Epoche=6303\n",
      "Epsilon=0.899527 Action_times=1070147 Epoche=6304\n",
      "Epsilon=0.899273 Action_times=1073002 Epoche=6305\n",
      "Epsilon=0.899149 Action_times=1074397 Epoche=6306\n",
      "Epsilon=0.898887 Action_times=1077350 Epoche=6307\n",
      "Epsilon=0.898709 Action_times=1079350 Epoche=6308\n",
      "Epsilon=0.898644 Action_times=1080082 Epoche=6309\n",
      "Epsilon=0.898584 Action_times=1080757 Epoche=6310\n",
      "Epsilon=0.898539 Action_times=1081264 Epoche=6311\n",
      "Epsilon=0.898446 Action_times=1082314 Epoche=6312\n",
      "Epsilon=0.898396 Action_times=1082879 Epoche=6313\n",
      "Epsilon=0.898319 Action_times=1083745 Epoche=6314\n",
      "Epsilon=0.898093 Action_times=1086281 Epoche=6315\n",
      "Epsilon=0.897879 Action_times=1088700 Epoche=6316\n",
      "Epsilon=0.897743 Action_times=1090223 Epoche=6317\n",
      "Epsilon=0.897577 Action_times=1092095 Epoche=6318\n",
      "Epsilon=0.897352 Action_times=1094632 Epoche=6319\n",
      "Epsilon=0.897297 Action_times=1095250 Epoche=6320\n",
      "Epsilon=0.897102 Action_times=1097449 Epoche=6321\n",
      "Epsilon=0.896908 Action_times=1099642 Epoche=6322\n",
      "Epsilon=0.896667 Action_times=1102360 Epoche=6323\n",
      "Epsilon=0.896615 Action_times=1102936 Epoche=6324\n",
      "Epsilon=0.896321 Action_times=1106255 Epoche=6325\n",
      "Epsilon=0.895975 Action_times=1110165 Epoche=6326\n",
      "Epsilon=0.895878 Action_times=1111261 Epoche=6327\n",
      "Epsilon=0.895631 Action_times=1114044 Epoche=6328\n",
      "Epsilon=0.895338 Action_times=1117350 Epoche=6329\n",
      "Epsilon=0.895108 Action_times=1119950 Epoche=6330\n",
      "Epsilon=0.894937 Action_times=1121882 Epoche=6331\n",
      "Epsilon=0.894670 Action_times=1124904 Epoche=6332\n",
      "Epsilon=0.894467 Action_times=1127192 Epoche=6333\n",
      "Epsilon=0.894361 Action_times=1128400 Epoche=6334\n",
      "Epsilon=0.894200 Action_times=1130218 Epoche=6335\n",
      "Epsilon=0.893832 Action_times=1134376 Epoche=6336\n",
      "Epsilon=0.893528 Action_times=1137818 Epoche=6337\n",
      "Epsilon=0.893357 Action_times=1139756 Epoche=6338\n",
      "Epsilon=0.893192 Action_times=1141623 Epoche=6339\n",
      "Epsilon=0.893192 Action_times=1141628 Epoche=6340\n",
      "Epsilon=0.893054 Action_times=1143188 Epoche=6341\n",
      "Epsilon=0.892856 Action_times=1145428 Epoche=6342\n",
      "Epsilon=0.892787 Action_times=1146214 Epoche=6343\n",
      "Epsilon=0.892613 Action_times=1148179 Epoche=6344\n",
      "Epsilon=0.892317 Action_times=1151538 Epoche=6345\n",
      "Epsilon=0.892160 Action_times=1153318 Epoche=6346\n",
      "Epsilon=0.892102 Action_times=1153973 Epoche=6347\n",
      "Epsilon=0.891896 Action_times=1156310 Epoche=6348\n",
      "Epsilon=0.891786 Action_times=1157556 Epoche=6349\n",
      "Epsilon=0.891480 Action_times=1161030 Epoche=6350\n",
      "Epsilon=0.891157 Action_times=1164688 Epoche=6351\n",
      "Epsilon=0.890961 Action_times=1166912 Epoche=6352\n",
      "Epsilon=0.890940 Action_times=1167157 Epoche=6353\n",
      "Epsilon=0.890676 Action_times=1170149 Epoche=6354\n",
      "Epsilon=0.890493 Action_times=1172233 Epoche=6355\n",
      "Epsilon=0.890331 Action_times=1174065 Epoche=6356\n",
      "Epsilon=0.889910 Action_times=1178853 Epoche=6357\n",
      "Epsilon=0.889800 Action_times=1180109 Epoche=6358\n",
      "Epsilon=0.889449 Action_times=1184092 Epoche=6359\n",
      "Epsilon=0.889333 Action_times=1185412 Epoche=6360\n",
      "Epsilon=0.889110 Action_times=1187947 Epoche=6361\n",
      "Epsilon=0.889063 Action_times=1188484 Epoche=6362\n",
      "Epsilon=0.888910 Action_times=1190227 Epoche=6363\n",
      "Epsilon=0.888507 Action_times=1194812 Epoche=6364\n",
      "Epsilon=0.888429 Action_times=1195699 Epoche=6365\n",
      "Epsilon=0.888180 Action_times=1198533 Epoche=6366\n",
      "Epsilon=0.887892 Action_times=1201813 Epoche=6367\n",
      "Epsilon=0.887687 Action_times=1204151 Epoche=6368\n",
      "Epsilon=0.887377 Action_times=1207681 Epoche=6369\n",
      "Epsilon=0.886812 Action_times=1214118 Epoche=6370\n",
      "Epsilon=0.886694 Action_times=1215467 Epoche=6371\n",
      "Epsilon=0.886493 Action_times=1217760 Epoche=6372\n",
      "Epsilon=0.886332 Action_times=1219595 Epoche=6373\n",
      "Epsilon=0.886215 Action_times=1220929 Epoche=6374\n",
      "Epsilon=0.885956 Action_times=1223886 Epoche=6375\n",
      "Epsilon=0.885816 Action_times=1225484 Epoche=6376\n",
      "Epsilon=0.885425 Action_times=1229957 Epoche=6377\n",
      "Epsilon=0.885235 Action_times=1232120 Epoche=6378\n",
      "Epsilon=0.885007 Action_times=1234735 Epoche=6379\n",
      "Epsilon=0.884997 Action_times=1234845 Epoche=6380\n",
      "Epsilon=0.884748 Action_times=1237694 Epoche=6381\n",
      "Epsilon=0.884509 Action_times=1240418 Epoche=6382\n",
      "Epsilon=0.884280 Action_times=1243039 Epoche=6383\n",
      "Epsilon=0.884082 Action_times=1245309 Epoche=6384\n",
      "Epsilon=0.883938 Action_times=1246958 Epoche=6385\n",
      "Epsilon=0.883748 Action_times=1249134 Epoche=6386\n",
      "Epsilon=0.883085 Action_times=1256718 Epoche=6387\n",
      "Epsilon=0.882908 Action_times=1258750 Epoche=6388\n",
      "Epsilon=0.882734 Action_times=1260740 Epoche=6389\n",
      "Epsilon=0.882671 Action_times=1261462 Epoche=6390\n",
      "Epsilon=0.882398 Action_times=1264597 Epoche=6391\n",
      "Epsilon=0.882314 Action_times=1265556 Epoche=6392\n",
      "Epsilon=0.882075 Action_times=1268297 Epoche=6393\n",
      "Epsilon=0.882064 Action_times=1268419 Epoche=6394\n",
      "Epsilon=0.881843 Action_times=1270960 Epoche=6395\n",
      "Epsilon=0.881585 Action_times=1273921 Epoche=6396\n",
      "Epsilon=0.881233 Action_times=1277959 Epoche=6397\n",
      "Epsilon=0.881064 Action_times=1279890 Epoche=6398\n",
      "Epsilon=0.881062 Action_times=1279917 Epoche=6399\n",
      "Epsilon=0.880750 Action_times=1283503 Epoche=6400\n",
      "Epsilon=0.880554 Action_times=1285749 Epoche=6401\n",
      "Epsilon=0.880202 Action_times=1289801 Epoche=6402\n",
      "Epsilon=0.879962 Action_times=1292553 Epoche=6403\n",
      "Epsilon=0.879773 Action_times=1294730 Epoche=6404\n",
      "Epsilon=0.879467 Action_times=1298246 Epoche=6405\n",
      "Epsilon=0.879287 Action_times=1300312 Epoche=6406\n",
      "Epsilon=0.879123 Action_times=1302201 Epoche=6407\n",
      "Epsilon=0.878970 Action_times=1303961 Epoche=6408\n",
      "Epsilon=0.878672 Action_times=1307395 Epoche=6409\n",
      "Epsilon=0.878560 Action_times=1308677 Epoche=6410\n",
      "Epsilon=0.878383 Action_times=1310723 Epoche=6411\n",
      "Epsilon=0.878295 Action_times=1311740 Epoche=6412\n",
      "Epsilon=0.878041 Action_times=1314665 Epoche=6413\n",
      "Epsilon=0.877748 Action_times=1318039 Epoche=6414\n",
      "Epsilon=0.877479 Action_times=1321131 Epoche=6415\n",
      "Epsilon=0.877347 Action_times=1322663 Epoche=6416\n",
      "Epsilon=0.877195 Action_times=1324406 Epoche=6417\n",
      "Epsilon=0.876961 Action_times=1327104 Epoche=6418\n",
      "Epsilon=0.876620 Action_times=1331044 Epoche=6419\n",
      "Epsilon=0.876431 Action_times=1333225 Epoche=6420\n",
      "Epsilon=0.876219 Action_times=1335677 Epoche=6421\n",
      "Epsilon=0.876192 Action_times=1335982 Epoche=6422\n",
      "Epsilon=0.876146 Action_times=1336514 Epoche=6423\n",
      "Epsilon=0.875872 Action_times=1339682 Epoche=6424\n",
      "Epsilon=0.875753 Action_times=1341050 Epoche=6425\n",
      "Epsilon=0.875733 Action_times=1341283 Epoche=6426\n",
      "Epsilon=0.875638 Action_times=1342380 Epoche=6427\n",
      "Epsilon=0.875577 Action_times=1343085 Epoche=6428\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.875509 Action_times=1343874 Epoche=6429\n",
      "Epsilon=0.875268 Action_times=1346660 Epoche=6430\n",
      "Epsilon=0.875079 Action_times=1348840 Epoche=6431\n",
      "Epsilon=0.875027 Action_times=1349446 Epoche=6432\n",
      "Epsilon=0.874904 Action_times=1350864 Epoche=6433\n",
      "Epsilon=0.874786 Action_times=1352225 Epoche=6434\n",
      "Epsilon=0.874720 Action_times=1352996 Epoche=6435\n",
      "Epsilon=0.874547 Action_times=1354996 Epoche=6436\n",
      "Epsilon=0.874315 Action_times=1357674 Epoche=6437\n",
      "Epsilon=0.874139 Action_times=1359714 Epoche=6438\n",
      "Epsilon=0.873891 Action_times=1362580 Epoche=6439\n",
      "Epsilon=0.873812 Action_times=1363497 Epoche=6440\n",
      "Epsilon=0.873528 Action_times=1366785 Epoche=6441\n",
      "Epsilon=0.873186 Action_times=1370744 Epoche=6442\n",
      "Epsilon=0.873153 Action_times=1371134 Epoche=6443\n",
      "Epsilon=0.873146 Action_times=1371216 Epoche=6444\n",
      "Epsilon=0.873034 Action_times=1372509 Epoche=6445\n",
      "Epsilon=0.872873 Action_times=1374377 Epoche=6446\n",
      "Epsilon=0.872749 Action_times=1375809 Epoche=6447\n",
      "Epsilon=0.872598 Action_times=1377557 Epoche=6448\n",
      "Epsilon=0.872443 Action_times=1379356 Epoche=6449\n",
      "Epsilon=0.872377 Action_times=1380120 Epoche=6450\n",
      "Epsilon=0.872344 Action_times=1380511 Epoche=6451\n",
      "Epsilon=0.872187 Action_times=1382324 Epoche=6452\n",
      "Epsilon=0.872186 Action_times=1382340 Epoche=6453\n",
      "Epsilon=0.871921 Action_times=1385415 Epoche=6454\n",
      "Epsilon=0.871709 Action_times=1387878 Epoche=6455\n",
      "Epsilon=0.871510 Action_times=1390185 Epoche=6456\n",
      "Epsilon=0.871269 Action_times=1392986 Epoche=6457\n",
      "Epsilon=0.871182 Action_times=1393990 Epoche=6458\n",
      "Epsilon=0.870950 Action_times=1396686 Epoche=6459\n",
      "Epsilon=0.870716 Action_times=1399400 Epoche=6460\n",
      "Epsilon=0.870699 Action_times=1399605 Epoche=6461\n",
      "Epsilon=0.870511 Action_times=1401780 Epoche=6462\n",
      "Epsilon=0.870291 Action_times=1404337 Epoche=6463\n",
      "Epsilon=0.870121 Action_times=1406316 Epoche=6464\n",
      "Epsilon=0.869994 Action_times=1407792 Epoche=6465\n",
      "Epsilon=0.869668 Action_times=1411591 Epoche=6466\n",
      "Epsilon=0.869521 Action_times=1413299 Epoche=6467\n",
      "Epsilon=0.869329 Action_times=1415527 Epoche=6468\n",
      "Epsilon=0.869299 Action_times=1415883 Epoche=6469\n",
      "Epsilon=0.869156 Action_times=1417547 Epoche=6470\n",
      "Epsilon=0.868981 Action_times=1419584 Epoche=6471\n",
      "Epsilon=0.868939 Action_times=1420075 Epoche=6472\n",
      "Epsilon=0.868582 Action_times=1424228 Epoche=6473\n",
      "Epsilon=0.868365 Action_times=1426761 Epoche=6474\n",
      "Epsilon=0.868137 Action_times=1429415 Epoche=6475\n",
      "Epsilon=0.867936 Action_times=1431752 Epoche=6476\n",
      "Epsilon=0.867848 Action_times=1432778 Epoche=6477\n",
      "Epsilon=0.867642 Action_times=1435181 Epoche=6478\n",
      "Epsilon=0.867467 Action_times=1437227 Epoche=6479\n",
      "Epsilon=0.867281 Action_times=1439394 Epoche=6480\n",
      "Epsilon=0.866927 Action_times=1443526 Epoche=6481\n",
      "Epsilon=0.866738 Action_times=1445731 Epoche=6482\n",
      "Epsilon=0.866593 Action_times=1447418 Epoche=6483\n",
      "Epsilon=0.866370 Action_times=1450024 Epoche=6484\n",
      "Epsilon=0.866329 Action_times=1450503 Epoche=6485\n",
      "Epsilon=0.865890 Action_times=1455627 Epoche=6486\n",
      "Epsilon=0.865421 Action_times=1461114 Epoche=6487\n",
      "Epsilon=0.865282 Action_times=1462739 Epoche=6488\n",
      "Epsilon=0.865071 Action_times=1465206 Epoche=6489\n",
      "Epsilon=0.864763 Action_times=1468803 Epoche=6490\n",
      "Epsilon=0.864451 Action_times=1472463 Epoche=6491\n",
      "Epsilon=0.864252 Action_times=1474787 Epoche=6492\n",
      "Epsilon=0.864091 Action_times=1476672 Epoche=6493\n",
      "Epsilon=0.863834 Action_times=1479680 Epoche=6494\n",
      "Epsilon=0.863724 Action_times=1480971 Epoche=6495\n",
      "Epsilon=0.863540 Action_times=1483127 Epoche=6496\n",
      "Epsilon=0.863460 Action_times=1484063 Epoche=6497\n",
      "Epsilon=0.863338 Action_times=1485490 Epoche=6498\n",
      "Epsilon=0.863325 Action_times=1485645 Epoche=6499\n",
      "Epsilon=0.863186 Action_times=1487268 Epoche=6500\n",
      "Epsilon=0.862910 Action_times=1490514 Epoche=6501\n",
      "Epsilon=0.862627 Action_times=1493827 Epoche=6502\n",
      "Epsilon=0.862482 Action_times=1495534 Epoche=6503\n",
      "Epsilon=0.862322 Action_times=1497410 Epoche=6504\n",
      "Epsilon=0.862213 Action_times=1498685 Epoche=6505\n",
      "Epsilon=0.862010 Action_times=1501062 Epoche=6506\n",
      "Epsilon=0.861757 Action_times=1504040 Epoche=6507\n",
      "Epsilon=0.861728 Action_times=1504378 Epoche=6508\n",
      "Epsilon=0.861409 Action_times=1508124 Epoche=6509\n",
      "Epsilon=0.861375 Action_times=1508522 Epoche=6510\n",
      "Epsilon=0.861028 Action_times=1512600 Epoche=6511\n",
      "Epsilon=0.860841 Action_times=1514795 Epoche=6512\n",
      "Epsilon=0.860711 Action_times=1516322 Epoche=6513\n",
      "Epsilon=0.860651 Action_times=1517032 Epoche=6514\n",
      "Epsilon=0.860366 Action_times=1520381 Epoche=6515\n",
      "Epsilon=0.860129 Action_times=1523170 Epoche=6516\n",
      "Epsilon=0.859989 Action_times=1524821 Epoche=6517\n",
      "Epsilon=0.859833 Action_times=1526656 Epoche=6518\n",
      "Epsilon=0.859688 Action_times=1528356 Epoche=6519\n",
      "Epsilon=0.859660 Action_times=1528687 Epoche=6520\n",
      "Epsilon=0.859585 Action_times=1529573 Epoche=6521\n",
      "Epsilon=0.859432 Action_times=1531367 Epoche=6522\n",
      "Epsilon=0.859202 Action_times=1534079 Epoche=6523\n",
      "Epsilon=0.859110 Action_times=1535162 Epoche=6524\n",
      "Epsilon=0.859021 Action_times=1536207 Epoche=6525\n",
      "Epsilon=0.858813 Action_times=1538655 Epoche=6526\n",
      "Epsilon=0.858773 Action_times=1539137 Epoche=6527\n",
      "Epsilon=0.858721 Action_times=1539743 Epoche=6528\n",
      "Epsilon=0.858610 Action_times=1541048 Epoche=6529\n",
      "Epsilon=0.858383 Action_times=1543728 Epoche=6530\n",
      "Epsilon=0.858062 Action_times=1547512 Epoche=6531\n",
      "Epsilon=0.857917 Action_times=1549219 Epoche=6532\n",
      "Epsilon=0.857596 Action_times=1553011 Epoche=6533\n",
      "Epsilon=0.857346 Action_times=1555954 Epoche=6534\n",
      "Epsilon=0.857285 Action_times=1556679 Epoche=6535\n",
      "Epsilon=0.856958 Action_times=1560540 Epoche=6536\n",
      "Epsilon=0.856773 Action_times=1562717 Epoche=6537\n",
      "Epsilon=0.856651 Action_times=1564164 Epoche=6538\n",
      "Epsilon=0.856544 Action_times=1565426 Epoche=6539\n",
      "Epsilon=0.856395 Action_times=1567190 Epoche=6540\n",
      "Epsilon=0.856322 Action_times=1568047 Epoche=6541\n",
      "Epsilon=0.856181 Action_times=1569722 Epoche=6542\n",
      "Epsilon=0.856152 Action_times=1570064 Epoche=6543\n",
      "Epsilon=0.856008 Action_times=1571761 Epoche=6544\n",
      "Epsilon=0.855734 Action_times=1575004 Epoche=6545\n",
      "Epsilon=0.855669 Action_times=1575769 Epoche=6546\n",
      "Epsilon=0.855614 Action_times=1576420 Epoche=6547\n",
      "Epsilon=0.855533 Action_times=1577373 Epoche=6548\n",
      "Epsilon=0.855293 Action_times=1580217 Epoche=6549\n",
      "Epsilon=0.855176 Action_times=1581606 Epoche=6550\n",
      "Epsilon=0.855089 Action_times=1582634 Epoche=6551\n",
      "Epsilon=0.855026 Action_times=1583371 Epoche=6552\n",
      "Epsilon=0.854857 Action_times=1585370 Epoche=6553\n",
      "Epsilon=0.854653 Action_times=1587786 Epoche=6554\n",
      "Epsilon=0.854575 Action_times=1588716 Epoche=6555\n",
      "Epsilon=0.854472 Action_times=1589933 Epoche=6556\n",
      "Epsilon=0.854398 Action_times=1590810 Epoche=6557\n",
      "Epsilon=0.854241 Action_times=1592664 Epoche=6558\n",
      "Epsilon=0.854043 Action_times=1595013 Epoche=6559\n",
      "Epsilon=0.853805 Action_times=1597830 Epoche=6560\n",
      "Epsilon=0.853690 Action_times=1599199 Epoche=6561\n",
      "Epsilon=0.853476 Action_times=1601737 Epoche=6562\n",
      "Epsilon=0.853311 Action_times=1603692 Epoche=6563\n",
      "Epsilon=0.853202 Action_times=1604989 Epoche=6564\n",
      "Epsilon=0.853134 Action_times=1605785 Epoche=6565\n",
      "Epsilon=0.853034 Action_times=1606973 Epoche=6566\n",
      "Epsilon=0.852954 Action_times=1607923 Epoche=6567\n",
      "Epsilon=0.852859 Action_times=1609058 Epoche=6568\n",
      "Epsilon=0.852674 Action_times=1611244 Epoche=6569\n",
      "Epsilon=0.852574 Action_times=1612440 Epoche=6570\n",
      "Epsilon=0.852378 Action_times=1614766 Epoche=6571\n",
      "Epsilon=0.852278 Action_times=1615946 Epoche=6572\n",
      "Epsilon=0.851999 Action_times=1619256 Epoche=6573\n",
      "Epsilon=0.851907 Action_times=1620353 Epoche=6574\n",
      "Epsilon=0.851665 Action_times=1623231 Epoche=6575\n",
      "Epsilon=0.851489 Action_times=1625322 Epoche=6576\n",
      "Epsilon=0.851329 Action_times=1627226 Epoche=6577\n",
      "Epsilon=0.851167 Action_times=1629152 Epoche=6578\n",
      "Epsilon=0.851097 Action_times=1629985 Epoche=6579\n",
      "Epsilon=0.850980 Action_times=1631372 Epoche=6580\n",
      "Epsilon=0.850826 Action_times=1633199 Epoche=6581\n",
      "Epsilon=0.850697 Action_times=1634736 Epoche=6582\n",
      "Epsilon=0.850407 Action_times=1638187 Epoche=6583\n",
      "Epsilon=0.850337 Action_times=1639015 Epoche=6584\n",
      "Epsilon=0.850285 Action_times=1639641 Epoche=6585\n",
      "Epsilon=0.850062 Action_times=1642296 Epoche=6586\n",
      "Epsilon=0.850000 Action_times=1643036 Epoche=6587\n",
      "Epsilon=0.849902 Action_times=1644201 Epoche=6588\n",
      "Epsilon=0.849857 Action_times=1644737 Epoche=6589\n",
      "Epsilon=0.849725 Action_times=1646306 Epoche=6590\n",
      "Epsilon=0.849529 Action_times=1648638 Epoche=6591\n",
      "Epsilon=0.849451 Action_times=1649565 Epoche=6592\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.849394 Action_times=1650244 Epoche=6593\n",
      "Epsilon=0.849366 Action_times=1650577 Epoche=6594\n",
      "Epsilon=0.849226 Action_times=1652254 Epoche=6595\n",
      "Epsilon=0.849133 Action_times=1653356 Epoche=6596\n",
      "Epsilon=0.848968 Action_times=1655329 Epoche=6597\n",
      "Epsilon=0.848892 Action_times=1656229 Epoche=6598\n",
      "Epsilon=0.848549 Action_times=1660319 Epoche=6599\n",
      "Epsilon=0.848497 Action_times=1660934 Epoche=6600\n",
      "Epsilon=0.848419 Action_times=1661866 Epoche=6601\n",
      "Epsilon=0.848391 Action_times=1662203 Epoche=6602\n",
      "Epsilon=0.848331 Action_times=1662922 Epoche=6603\n",
      "Epsilon=0.848316 Action_times=1663103 Epoche=6604\n",
      "Epsilon=0.848282 Action_times=1663504 Epoche=6605\n",
      "Epsilon=0.848120 Action_times=1665434 Epoche=6606\n",
      "Epsilon=0.847705 Action_times=1670384 Epoche=6607\n",
      "Epsilon=0.847335 Action_times=1674809 Epoche=6608\n",
      "Epsilon=0.847107 Action_times=1677532 Epoche=6609\n",
      "Epsilon=0.847003 Action_times=1678772 Epoche=6610\n",
      "Epsilon=0.846970 Action_times=1679171 Epoche=6611\n",
      "Epsilon=0.846920 Action_times=1679768 Epoche=6612\n",
      "Epsilon=0.846794 Action_times=1681265 Epoche=6613\n",
      "Epsilon=0.846731 Action_times=1682024 Epoche=6614\n",
      "Epsilon=0.846567 Action_times=1683985 Epoche=6615\n",
      "Epsilon=0.846409 Action_times=1685874 Epoche=6616\n",
      "Epsilon=0.846405 Action_times=1685921 Epoche=6617\n",
      "Epsilon=0.846220 Action_times=1688130 Epoche=6618\n",
      "Epsilon=0.846166 Action_times=1688778 Epoche=6619\n",
      "Epsilon=0.846088 Action_times=1689710 Epoche=6620\n",
      "Epsilon=0.846003 Action_times=1690722 Epoche=6621\n",
      "Epsilon=0.845836 Action_times=1692725 Epoche=6622\n",
      "Epsilon=0.845731 Action_times=1693981 Epoche=6623\n",
      "Epsilon=0.845589 Action_times=1695679 Epoche=6624\n",
      "Epsilon=0.845332 Action_times=1698752 Epoche=6625\n",
      "Epsilon=0.845269 Action_times=1699512 Epoche=6626\n",
      "Epsilon=0.845051 Action_times=1702125 Epoche=6627\n",
      "Epsilon=0.844861 Action_times=1704394 Epoche=6628\n",
      "Epsilon=0.844781 Action_times=1705353 Epoche=6629\n",
      "Epsilon=0.844615 Action_times=1707340 Epoche=6630\n",
      "Epsilon=0.844544 Action_times=1708191 Epoche=6631\n",
      "Epsilon=0.844406 Action_times=1709854 Epoche=6632\n",
      "Epsilon=0.844188 Action_times=1712462 Epoche=6633\n",
      "Epsilon=0.843982 Action_times=1714927 Epoche=6634\n",
      "Epsilon=0.843892 Action_times=1716008 Epoche=6635\n",
      "Epsilon=0.843837 Action_times=1716666 Epoche=6636\n",
      "Epsilon=0.843738 Action_times=1717856 Epoche=6637\n",
      "Epsilon=0.843689 Action_times=1718448 Epoche=6638\n",
      "Epsilon=0.843682 Action_times=1718532 Epoche=6639\n",
      "Epsilon=0.843495 Action_times=1720773 Epoche=6640\n",
      "Epsilon=0.843414 Action_times=1721750 Epoche=6641\n",
      "Epsilon=0.843130 Action_times=1725150 Epoche=6642\n",
      "Epsilon=0.842735 Action_times=1729894 Epoche=6643\n",
      "Epsilon=0.842643 Action_times=1731004 Epoche=6644\n",
      "Epsilon=0.842446 Action_times=1733368 Epoche=6645\n",
      "Epsilon=0.842141 Action_times=1737028 Epoche=6646\n",
      "Epsilon=0.841922 Action_times=1739666 Epoche=6647\n",
      "Epsilon=0.841705 Action_times=1742268 Epoche=6648\n",
      "Epsilon=0.841493 Action_times=1744817 Epoche=6649\n",
      "Epsilon=0.841317 Action_times=1746941 Epoche=6650\n",
      "Epsilon=0.841108 Action_times=1749446 Epoche=6651\n",
      "Epsilon=0.841008 Action_times=1750653 Epoche=6652\n",
      "Epsilon=0.840891 Action_times=1752060 Epoche=6653\n",
      "Epsilon=0.840807 Action_times=1753074 Epoche=6654\n",
      "Epsilon=0.840756 Action_times=1753690 Epoche=6655\n",
      "Epsilon=0.840513 Action_times=1756616 Epoche=6656\n",
      "Epsilon=0.840457 Action_times=1757283 Epoche=6657\n",
      "Epsilon=0.840366 Action_times=1758386 Epoche=6658\n",
      "Epsilon=0.840307 Action_times=1759097 Epoche=6659\n",
      "Epsilon=0.840214 Action_times=1760218 Epoche=6660\n",
      "Epsilon=0.840140 Action_times=1761101 Epoche=6661\n",
      "Epsilon=0.839999 Action_times=1762802 Epoche=6662\n",
      "Epsilon=0.839932 Action_times=1763607 Epoche=6663\n",
      "Epsilon=0.839851 Action_times=1764582 Epoche=6664\n",
      "Epsilon=0.839726 Action_times=1766096 Epoche=6665\n",
      "Epsilon=0.839511 Action_times=1768683 Epoche=6666\n",
      "Epsilon=0.839316 Action_times=1771034 Epoche=6667\n",
      "Epsilon=0.838973 Action_times=1775171 Epoche=6668\n",
      "Epsilon=0.838877 Action_times=1776335 Epoche=6669\n",
      "Epsilon=0.838805 Action_times=1777203 Epoche=6670\n",
      "Epsilon=0.838735 Action_times=1778045 Epoche=6671\n",
      "Epsilon=0.838702 Action_times=1778439 Epoche=6672\n",
      "Epsilon=0.838586 Action_times=1779840 Epoche=6673\n",
      "Epsilon=0.838517 Action_times=1780677 Epoche=6674\n",
      "Epsilon=0.838400 Action_times=1782089 Epoche=6675\n",
      "Epsilon=0.838298 Action_times=1783325 Epoche=6676\n",
      "Epsilon=0.838221 Action_times=1784254 Epoche=6677\n",
      "Epsilon=0.838039 Action_times=1786452 Epoche=6678\n",
      "Epsilon=0.837915 Action_times=1787948 Epoche=6679\n",
      "Epsilon=0.837873 Action_times=1788457 Epoche=6680\n",
      "Epsilon=0.837655 Action_times=1791084 Epoche=6681\n",
      "Epsilon=0.837148 Action_times=1797211 Epoche=6682\n",
      "Epsilon=0.836977 Action_times=1799281 Epoche=6683\n",
      "Epsilon=0.836832 Action_times=1801039 Epoche=6684\n",
      "Epsilon=0.836669 Action_times=1803004 Epoche=6685\n",
      "Epsilon=0.836393 Action_times=1806348 Epoche=6686\n",
      "Epsilon=0.836293 Action_times=1807555 Epoche=6687\n",
      "Epsilon=0.836208 Action_times=1808587 Epoche=6688\n",
      "Epsilon=0.835981 Action_times=1811332 Epoche=6689\n",
      "Epsilon=0.835684 Action_times=1814925 Epoche=6690\n",
      "Epsilon=0.835460 Action_times=1817644 Epoche=6691\n",
      "Epsilon=0.835397 Action_times=1818410 Epoche=6692\n",
      "Epsilon=0.835183 Action_times=1820992 Epoche=6693\n",
      "Epsilon=0.835024 Action_times=1822925 Epoche=6694\n",
      "Epsilon=0.834877 Action_times=1824706 Epoche=6695\n",
      "Epsilon=0.834720 Action_times=1826605 Epoche=6696\n",
      "Epsilon=0.834551 Action_times=1828656 Epoche=6697\n",
      "Epsilon=0.834439 Action_times=1830014 Epoche=6698\n",
      "Epsilon=0.834351 Action_times=1831087 Epoche=6699\n",
      "Epsilon=0.834259 Action_times=1832203 Epoche=6700\n",
      "Epsilon=0.834097 Action_times=1834168 Epoche=6701\n",
      "Epsilon=0.834042 Action_times=1834838 Epoche=6702\n",
      "Epsilon=0.833946 Action_times=1836005 Epoche=6703\n",
      "Epsilon=0.833933 Action_times=1836152 Epoche=6704\n",
      "Epsilon=0.833899 Action_times=1836565 Epoche=6705\n",
      "Epsilon=0.833474 Action_times=1841730 Epoche=6706\n",
      "Epsilon=0.833218 Action_times=1844844 Epoche=6707\n",
      "Epsilon=0.833042 Action_times=1846982 Epoche=6708\n",
      "Epsilon=0.832921 Action_times=1848447 Epoche=6709\n",
      "Epsilon=0.832801 Action_times=1849906 Epoche=6710\n",
      "Epsilon=0.832650 Action_times=1851737 Epoche=6711\n",
      "Epsilon=0.832581 Action_times=1852579 Epoche=6712\n",
      "Epsilon=0.832449 Action_times=1854180 Epoche=6713\n",
      "Epsilon=0.832321 Action_times=1855743 Epoche=6714\n",
      "Epsilon=0.832318 Action_times=1855778 Epoche=6715\n",
      "Epsilon=0.832203 Action_times=1857176 Epoche=6716\n",
      "Epsilon=0.831984 Action_times=1859843 Epoche=6717\n",
      "Epsilon=0.831976 Action_times=1859935 Epoche=6718\n",
      "Epsilon=0.831922 Action_times=1860595 Epoche=6719\n",
      "Epsilon=0.831760 Action_times=1862560 Epoche=6720\n",
      "Epsilon=0.831651 Action_times=1863897 Epoche=6721\n",
      "Epsilon=0.831566 Action_times=1864926 Epoche=6722\n",
      "Epsilon=0.831503 Action_times=1865695 Epoche=6723\n",
      "Epsilon=0.831387 Action_times=1867100 Epoche=6724\n",
      "Epsilon=0.831331 Action_times=1867789 Epoche=6725\n",
      "Epsilon=0.831069 Action_times=1870979 Epoche=6726\n",
      "Epsilon=0.830923 Action_times=1872761 Epoche=6727\n",
      "Epsilon=0.830769 Action_times=1874637 Epoche=6728\n",
      "Epsilon=0.830695 Action_times=1875536 Epoche=6729\n",
      "Epsilon=0.830626 Action_times=1876369 Epoche=6730\n",
      "Epsilon=0.830537 Action_times=1877454 Epoche=6731\n",
      "Epsilon=0.830523 Action_times=1877629 Epoche=6732\n",
      "Epsilon=0.830482 Action_times=1878135 Epoche=6733\n",
      "Epsilon=0.830399 Action_times=1879145 Epoche=6734\n",
      "Epsilon=0.830270 Action_times=1880714 Epoche=6735\n",
      "Epsilon=0.830194 Action_times=1881645 Epoche=6736\n",
      "Epsilon=0.830114 Action_times=1882618 Epoche=6737\n",
      "Epsilon=0.830099 Action_times=1882795 Epoche=6738\n",
      "Epsilon=0.829995 Action_times=1884071 Epoche=6739\n",
      "Epsilon=0.829937 Action_times=1884774 Epoche=6740\n",
      "Epsilon=0.829820 Action_times=1886199 Epoche=6741\n",
      "Epsilon=0.829576 Action_times=1889173 Epoche=6742\n",
      "Epsilon=0.829510 Action_times=1889980 Epoche=6743\n",
      "Epsilon=0.829406 Action_times=1891253 Epoche=6744\n",
      "Epsilon=0.829301 Action_times=1892529 Epoche=6745\n",
      "Epsilon=0.829105 Action_times=1894925 Epoche=6746\n",
      "Epsilon=0.828943 Action_times=1896900 Epoche=6747\n",
      "Epsilon=0.828887 Action_times=1897583 Epoche=6748\n",
      "Epsilon=0.828747 Action_times=1899303 Epoche=6749\n",
      "Epsilon=0.828738 Action_times=1899404 Epoche=6750\n",
      "Epsilon=0.828722 Action_times=1899606 Epoche=6751\n",
      "Epsilon=0.828511 Action_times=1902178 Epoche=6752\n",
      "Epsilon=0.828426 Action_times=1903214 Epoche=6753\n",
      "Epsilon=0.828365 Action_times=1903971 Epoche=6754\n",
      "Epsilon=0.828286 Action_times=1904931 Epoche=6755\n",
      "Epsilon=0.828154 Action_times=1906549 Epoche=6756\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.828037 Action_times=1907976 Epoche=6757\n",
      "Epsilon=0.827967 Action_times=1908826 Epoche=6758\n",
      "Epsilon=0.827875 Action_times=1909955 Epoche=6759\n",
      "Epsilon=0.827684 Action_times=1912289 Epoche=6760\n",
      "Epsilon=0.827654 Action_times=1912651 Epoche=6761\n",
      "Epsilon=0.827652 Action_times=1912676 Epoche=6762\n",
      "Epsilon=0.827480 Action_times=1914789 Epoche=6763\n",
      "Epsilon=0.827421 Action_times=1915510 Epoche=6764\n",
      "Epsilon=0.827167 Action_times=1918616 Epoche=6765\n",
      "Epsilon=0.827104 Action_times=1919386 Epoche=6766\n",
      "Epsilon=0.826863 Action_times=1922336 Epoche=6767\n",
      "Epsilon=0.826766 Action_times=1923517 Epoche=6768\n",
      "Epsilon=0.826273 Action_times=1929565 Epoche=6769\n",
      "Epsilon=0.826093 Action_times=1931772 Epoche=6770\n",
      "Epsilon=0.826014 Action_times=1932729 Epoche=6771\n",
      "Epsilon=0.825843 Action_times=1934830 Epoche=6772\n",
      "Epsilon=0.825753 Action_times=1935931 Epoche=6773\n",
      "Epsilon=0.825557 Action_times=1938337 Epoche=6774\n",
      "Epsilon=0.825497 Action_times=1939077 Epoche=6775\n",
      "Epsilon=0.825481 Action_times=1939270 Epoche=6776\n",
      "Epsilon=0.825415 Action_times=1940082 Epoche=6777\n",
      "Epsilon=0.825242 Action_times=1942200 Epoche=6778\n",
      "Epsilon=0.824917 Action_times=1946184 Epoche=6779\n",
      "Epsilon=0.824840 Action_times=1947130 Epoche=6780\n",
      "Epsilon=0.824716 Action_times=1948659 Epoche=6781\n",
      "Epsilon=0.824545 Action_times=1950751 Epoche=6782\n",
      "Epsilon=0.824441 Action_times=1952034 Epoche=6783\n",
      "Epsilon=0.824275 Action_times=1954062 Epoche=6784\n",
      "Epsilon=0.824144 Action_times=1955677 Epoche=6785\n",
      "Epsilon=0.823948 Action_times=1958083 Epoche=6786\n",
      "Epsilon=0.823852 Action_times=1959266 Epoche=6787\n",
      "Epsilon=0.823686 Action_times=1961307 Epoche=6788\n",
      "Epsilon=0.823492 Action_times=1963691 Epoche=6789\n",
      "Epsilon=0.823480 Action_times=1963836 Epoche=6790\n",
      "Epsilon=0.823298 Action_times=1966078 Epoche=6791\n",
      "Epsilon=0.823158 Action_times=1967789 Epoche=6792\n",
      "Epsilon=0.823028 Action_times=1969395 Epoche=6793\n",
      "Epsilon=0.822933 Action_times=1970563 Epoche=6794\n",
      "Epsilon=0.822877 Action_times=1971246 Epoche=6795\n",
      "Epsilon=0.822803 Action_times=1972167 Epoche=6796\n",
      "Epsilon=0.822688 Action_times=1973579 Epoche=6797\n",
      "Epsilon=0.822536 Action_times=1975443 Epoche=6798\n",
      "Epsilon=0.822457 Action_times=1976415 Epoche=6799\n",
      "Epsilon=0.822025 Action_times=1981732 Epoche=6800\n",
      "Epsilon=0.821947 Action_times=1982700 Epoche=6801\n",
      "Epsilon=0.821801 Action_times=1984502 Epoche=6802\n",
      "Epsilon=0.821636 Action_times=1986525 Epoche=6803\n",
      "Epsilon=0.821541 Action_times=1987706 Epoche=6804\n",
      "Epsilon=0.821399 Action_times=1989445 Epoche=6805\n",
      "Epsilon=0.821200 Action_times=1991908 Epoche=6806\n",
      "Epsilon=0.821076 Action_times=1993436 Epoche=6807\n",
      "Epsilon=0.820956 Action_times=1994917 Epoche=6808\n",
      "Epsilon=0.820875 Action_times=1995908 Epoche=6809\n",
      "Epsilon=0.820796 Action_times=1996879 Epoche=6810\n",
      "Epsilon=0.820711 Action_times=1997930 Epoche=6811\n",
      "Epsilon=0.820628 Action_times=1998955 Epoche=6812\n",
      "Epsilon=0.820488 Action_times=2000685 Epoche=6813\n",
      "Epsilon=0.820423 Action_times=2001482 Epoche=6814\n",
      "Epsilon=0.820333 Action_times=2002601 Epoche=6815\n",
      "Epsilon=0.820323 Action_times=2002718 Epoche=6816\n",
      "Epsilon=0.820123 Action_times=2005189 Epoche=6817\n",
      "Epsilon=0.819954 Action_times=2007274 Epoche=6818\n",
      "Epsilon=0.819867 Action_times=2008345 Epoche=6819\n",
      "Epsilon=0.819742 Action_times=2009887 Epoche=6820\n",
      "Epsilon=0.819730 Action_times=2010038 Epoche=6821\n",
      "Epsilon=0.819613 Action_times=2011490 Epoche=6822\n",
      "Epsilon=0.819542 Action_times=2012369 Epoche=6823\n",
      "Epsilon=0.819439 Action_times=2013633 Epoche=6824\n",
      "Epsilon=0.819388 Action_times=2014269 Epoche=6825\n",
      "Epsilon=0.819145 Action_times=2017274 Epoche=6826\n",
      "Epsilon=0.819005 Action_times=2019000 Epoche=6827\n",
      "Epsilon=0.818908 Action_times=2020203 Epoche=6828\n",
      "Epsilon=0.818883 Action_times=2020505 Epoche=6829\n",
      "Epsilon=0.818740 Action_times=2022269 Epoche=6830\n",
      "Epsilon=0.818694 Action_times=2022839 Epoche=6831\n",
      "Epsilon=0.818523 Action_times=2024961 Epoche=6832\n",
      "Epsilon=0.818392 Action_times=2026579 Epoche=6833\n",
      "Epsilon=0.818379 Action_times=2026742 Epoche=6834\n",
      "Epsilon=0.818203 Action_times=2028921 Epoche=6835\n",
      "Epsilon=0.818175 Action_times=2029261 Epoche=6836\n",
      "Epsilon=0.817955 Action_times=2031983 Epoche=6837\n",
      "Epsilon=0.817839 Action_times=2033421 Epoche=6838\n",
      "Epsilon=0.817646 Action_times=2035811 Epoche=6839\n",
      "Epsilon=0.817531 Action_times=2037229 Epoche=6840\n",
      "Epsilon=0.817472 Action_times=2037970 Epoche=6841\n",
      "Epsilon=0.817397 Action_times=2038890 Epoche=6842\n",
      "Epsilon=0.817209 Action_times=2041226 Epoche=6843\n",
      "Epsilon=0.817154 Action_times=2041903 Epoche=6844\n",
      "Epsilon=0.816913 Action_times=2044889 Epoche=6845\n",
      "Epsilon=0.816526 Action_times=2049686 Epoche=6846\n",
      "Epsilon=0.816278 Action_times=2052758 Epoche=6847\n",
      "Epsilon=0.816088 Action_times=2055123 Epoche=6848\n",
      "Epsilon=0.816022 Action_times=2055939 Epoche=6849\n",
      "Epsilon=0.815767 Action_times=2059098 Epoche=6850\n",
      "Epsilon=0.815732 Action_times=2059532 Epoche=6851\n",
      "Epsilon=0.815513 Action_times=2062254 Epoche=6852\n",
      "Epsilon=0.815397 Action_times=2063691 Epoche=6853\n",
      "Epsilon=0.815132 Action_times=2066990 Epoche=6854\n",
      "Epsilon=0.815072 Action_times=2067727 Epoche=6855\n",
      "Epsilon=0.814978 Action_times=2068903 Epoche=6856\n",
      "Epsilon=0.814928 Action_times=2069516 Epoche=6857\n",
      "Epsilon=0.814676 Action_times=2072650 Epoche=6858\n",
      "Epsilon=0.814347 Action_times=2076747 Epoche=6859\n",
      "Epsilon=0.814250 Action_times=2077946 Epoche=6860\n",
      "Epsilon=0.814154 Action_times=2079142 Epoche=6861\n",
      "Epsilon=0.814077 Action_times=2080101 Epoche=6862\n",
      "Epsilon=0.814043 Action_times=2080527 Epoche=6863\n",
      "Epsilon=0.813963 Action_times=2081515 Epoche=6864\n",
      "Epsilon=0.813824 Action_times=2083248 Epoche=6865\n",
      "Epsilon=0.813771 Action_times=2083900 Epoche=6866\n",
      "Epsilon=0.813712 Action_times=2084639 Epoche=6867\n",
      "Epsilon=0.813634 Action_times=2085607 Epoche=6868\n",
      "Epsilon=0.813341 Action_times=2089256 Epoche=6869\n",
      "Epsilon=0.813247 Action_times=2090421 Epoche=6870\n",
      "Epsilon=0.813093 Action_times=2092349 Epoche=6871\n",
      "Epsilon=0.812909 Action_times=2094632 Epoche=6872\n",
      "Epsilon=0.812638 Action_times=2098010 Epoche=6873\n",
      "Epsilon=0.812438 Action_times=2100509 Epoche=6874\n",
      "Epsilon=0.812251 Action_times=2102831 Epoche=6875\n",
      "Epsilon=0.812129 Action_times=2104354 Epoche=6876\n",
      "Epsilon=0.812073 Action_times=2105052 Epoche=6877\n",
      "Epsilon=0.811982 Action_times=2106183 Epoche=6878\n",
      "Epsilon=0.811912 Action_times=2107058 Epoche=6879\n",
      "Epsilon=0.811845 Action_times=2107892 Epoche=6880\n",
      "Epsilon=0.811726 Action_times=2109375 Epoche=6881\n",
      "Epsilon=0.811701 Action_times=2109693 Epoche=6882\n",
      "Epsilon=0.811608 Action_times=2110851 Epoche=6883\n",
      "Epsilon=0.811486 Action_times=2112379 Epoche=6884\n",
      "Epsilon=0.811310 Action_times=2114568 Epoche=6885\n",
      "Epsilon=0.811231 Action_times=2115560 Epoche=6886\n",
      "Epsilon=0.811229 Action_times=2115582 Epoche=6887\n",
      "Epsilon=0.811150 Action_times=2116564 Epoche=6888\n",
      "Epsilon=0.811092 Action_times=2117294 Epoche=6889\n",
      "Epsilon=0.810928 Action_times=2119337 Epoche=6890\n",
      "Epsilon=0.810793 Action_times=2121023 Epoche=6891\n",
      "Epsilon=0.810697 Action_times=2122218 Epoche=6892\n",
      "Epsilon=0.810613 Action_times=2123267 Epoche=6893\n",
      "Epsilon=0.810560 Action_times=2123930 Epoche=6894\n",
      "Epsilon=0.810440 Action_times=2125433 Epoche=6895\n",
      "Epsilon=0.810432 Action_times=2125537 Epoche=6896\n",
      "Epsilon=0.810406 Action_times=2125857 Epoche=6897\n",
      "Epsilon=0.810250 Action_times=2127810 Epoche=6898\n",
      "Epsilon=0.810191 Action_times=2128550 Epoche=6899\n",
      "Epsilon=0.810068 Action_times=2130079 Epoche=6900\n",
      "Epsilon=0.809946 Action_times=2131612 Epoche=6901\n",
      "Epsilon=0.809822 Action_times=2133152 Epoche=6902\n",
      "Epsilon=0.809715 Action_times=2134498 Epoche=6903\n",
      "Epsilon=0.809481 Action_times=2137418 Epoche=6904\n",
      "Epsilon=0.809384 Action_times=2138641 Epoche=6905\n",
      "Epsilon=0.809053 Action_times=2142773 Epoche=6906\n",
      "Epsilon=0.808919 Action_times=2144451 Epoche=6907\n",
      "Epsilon=0.808869 Action_times=2145079 Epoche=6908\n",
      "Epsilon=0.808844 Action_times=2145392 Epoche=6909\n",
      "Epsilon=0.808834 Action_times=2145513 Epoche=6910\n",
      "Epsilon=0.808793 Action_times=2146035 Epoche=6911\n",
      "Epsilon=0.808776 Action_times=2146246 Epoche=6912\n",
      "Epsilon=0.808639 Action_times=2147953 Epoche=6913\n",
      "Epsilon=0.808468 Action_times=2150095 Epoche=6914\n",
      "Epsilon=0.808403 Action_times=2150910 Epoche=6915\n",
      "Epsilon=0.808356 Action_times=2151498 Epoche=6916\n",
      "Epsilon=0.808252 Action_times=2152807 Epoche=6917\n",
      "Epsilon=0.808202 Action_times=2153432 Epoche=6918\n",
      "Epsilon=0.808144 Action_times=2154162 Epoche=6919\n",
      "Epsilon=0.808127 Action_times=2154375 Epoche=6920\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.808063 Action_times=2155178 Epoche=6921\n",
      "Epsilon=0.808008 Action_times=2155864 Epoche=6922\n",
      "Epsilon=0.807967 Action_times=2156380 Epoche=6923\n",
      "Epsilon=0.807716 Action_times=2159518 Epoche=6924\n",
      "Epsilon=0.807707 Action_times=2159639 Epoche=6925\n",
      "Epsilon=0.807531 Action_times=2161840 Epoche=6926\n",
      "Epsilon=0.807409 Action_times=2163377 Epoche=6927\n",
      "Epsilon=0.807357 Action_times=2164025 Epoche=6928\n",
      "Epsilon=0.807263 Action_times=2165206 Epoche=6929\n",
      "Epsilon=0.807193 Action_times=2166081 Epoche=6930\n",
      "Epsilon=0.807092 Action_times=2167347 Epoche=6931\n",
      "Epsilon=0.806953 Action_times=2169094 Epoche=6932\n",
      "Epsilon=0.806904 Action_times=2169706 Epoche=6933\n",
      "Epsilon=0.806828 Action_times=2170659 Epoche=6934\n",
      "Epsilon=0.806769 Action_times=2171406 Epoche=6935\n",
      "Epsilon=0.806502 Action_times=2174759 Epoche=6936\n",
      "Epsilon=0.806307 Action_times=2177200 Epoche=6937\n",
      "Epsilon=0.806137 Action_times=2179339 Epoche=6938\n",
      "Epsilon=0.806045 Action_times=2180491 Epoche=6939\n",
      "Epsilon=0.805993 Action_times=2181146 Epoche=6940\n",
      "Epsilon=0.805922 Action_times=2182033 Epoche=6941\n",
      "Epsilon=0.805880 Action_times=2182569 Epoche=6942\n",
      "Epsilon=0.805732 Action_times=2184425 Epoche=6943\n",
      "Epsilon=0.805588 Action_times=2186239 Epoche=6944\n",
      "Epsilon=0.805472 Action_times=2187697 Epoche=6945\n",
      "Epsilon=0.805170 Action_times=2191484 Epoche=6946\n",
      "Epsilon=0.804998 Action_times=2193654 Epoche=6947\n",
      "Epsilon=0.804809 Action_times=2196031 Epoche=6948\n",
      "Epsilon=0.804560 Action_times=2199166 Epoche=6949\n",
      "Epsilon=0.804263 Action_times=2202907 Epoche=6950\n",
      "Epsilon=0.804138 Action_times=2204481 Epoche=6951\n",
      "Epsilon=0.804087 Action_times=2205121 Epoche=6952\n",
      "Epsilon=0.804013 Action_times=2206056 Epoche=6953\n",
      "Epsilon=0.803876 Action_times=2207776 Epoche=6954\n",
      "Epsilon=0.803761 Action_times=2209222 Epoche=6955\n",
      "Epsilon=0.803722 Action_times=2209712 Epoche=6956\n",
      "Epsilon=0.803694 Action_times=2210069 Epoche=6957\n",
      "Epsilon=0.803654 Action_times=2210571 Epoche=6958\n",
      "Epsilon=0.803552 Action_times=2211863 Epoche=6959\n",
      "Epsilon=0.803458 Action_times=2213049 Epoche=6960\n",
      "Epsilon=0.803180 Action_times=2216553 Epoche=6961\n",
      "Epsilon=0.802977 Action_times=2219113 Epoche=6962\n",
      "Epsilon=0.802964 Action_times=2219273 Epoche=6963\n",
      "Epsilon=0.802877 Action_times=2220367 Epoche=6964\n",
      "Epsilon=0.802763 Action_times=2221802 Epoche=6965\n",
      "Epsilon=0.802624 Action_times=2223566 Epoche=6966\n",
      "Epsilon=0.802535 Action_times=2224684 Epoche=6967\n",
      "Epsilon=0.802375 Action_times=2226701 Epoche=6968\n",
      "Epsilon=0.802340 Action_times=2227143 Epoche=6969\n",
      "Epsilon=0.802213 Action_times=2228745 Epoche=6970\n",
      "Epsilon=0.802177 Action_times=2229198 Epoche=6971\n",
      "Epsilon=0.802129 Action_times=2229810 Epoche=6972\n",
      "Epsilon=0.802070 Action_times=2230555 Epoche=6973\n",
      "Epsilon=0.801914 Action_times=2232521 Epoche=6974\n",
      "Epsilon=0.801864 Action_times=2233153 Epoche=6975\n",
      "Epsilon=0.801822 Action_times=2233685 Epoche=6976\n",
      "Epsilon=0.801787 Action_times=2234125 Epoche=6977\n",
      "Epsilon=0.801666 Action_times=2235654 Epoche=6978\n",
      "Epsilon=0.801609 Action_times=2236379 Epoche=6979\n",
      "Epsilon=0.801471 Action_times=2238113 Epoche=6980\n",
      "Epsilon=0.801418 Action_times=2238793 Epoche=6981\n",
      "Epsilon=0.801101 Action_times=2242795 Epoche=6982\n",
      "Epsilon=0.801083 Action_times=2243023 Epoche=6983\n",
      "Epsilon=0.800972 Action_times=2244424 Epoche=6984\n",
      "Epsilon=0.800920 Action_times=2245077 Epoche=6985\n",
      "Epsilon=0.800806 Action_times=2246520 Epoche=6986\n",
      "Epsilon=0.800576 Action_times=2249431 Epoche=6987\n",
      "Epsilon=0.800538 Action_times=2249914 Epoche=6988\n",
      "Epsilon=0.800435 Action_times=2251210 Epoche=6989\n",
      "Epsilon=0.800434 Action_times=2251224 Epoche=6990\n",
      "Epsilon=0.800370 Action_times=2252037 Epoche=6991\n",
      "Epsilon=0.800185 Action_times=2254375 Epoche=6992\n",
      "Epsilon=0.800063 Action_times=2255920 Epoche=6993\n",
      "Epsilon=0.800029 Action_times=2256359 Epoche=6994\n",
      "Epsilon=0.799905 Action_times=2257921 Epoche=6995\n",
      "Epsilon=0.799717 Action_times=2260298 Epoche=6996\n",
      "Epsilon=0.799524 Action_times=2262741 Epoche=6997\n",
      "Epsilon=0.799387 Action_times=2264483 Epoche=6998\n",
      "Epsilon=0.799107 Action_times=2268031 Epoche=6999\n",
      "Epsilon=0.799077 Action_times=2268415 Epoche=7000\n",
      "Epsilon=0.798995 Action_times=2269449 Epoche=7001\n",
      "Epsilon=0.798701 Action_times=2273182 Epoche=7002\n",
      "Epsilon=0.798513 Action_times=2275555 Epoche=7003\n",
      "Epsilon=0.798466 Action_times=2276154 Epoche=7004\n",
      "Epsilon=0.798318 Action_times=2278029 Epoche=7005\n",
      "Epsilon=0.798255 Action_times=2278827 Epoche=7006\n",
      "Epsilon=0.798211 Action_times=2279393 Epoche=7007\n",
      "Epsilon=0.798141 Action_times=2280274 Epoche=7008\n",
      "Epsilon=0.797984 Action_times=2282270 Epoche=7009\n",
      "Epsilon=0.797900 Action_times=2283343 Epoche=7010\n",
      "Epsilon=0.797687 Action_times=2286041 Epoche=7011\n",
      "Epsilon=0.797628 Action_times=2286787 Epoche=7012\n",
      "Epsilon=0.797416 Action_times=2289482 Epoche=7013\n",
      "Epsilon=0.797207 Action_times=2292132 Epoche=7014\n",
      "Epsilon=0.797093 Action_times=2293580 Epoche=7015\n",
      "Epsilon=0.797030 Action_times=2294382 Epoche=7016\n",
      "Epsilon=0.796993 Action_times=2294861 Epoche=7017\n",
      "Epsilon=0.796846 Action_times=2296720 Epoche=7018\n",
      "Epsilon=0.796774 Action_times=2297637 Epoche=7019\n",
      "Epsilon=0.796740 Action_times=2298073 Epoche=7020\n",
      "Epsilon=0.796624 Action_times=2299545 Epoche=7021\n",
      "Epsilon=0.796482 Action_times=2301346 Epoche=7022\n",
      "Epsilon=0.796350 Action_times=2303033 Epoche=7023\n",
      "Epsilon=0.796179 Action_times=2305199 Epoche=7024\n",
      "Epsilon=0.796094 Action_times=2306284 Epoche=7025\n",
      "Epsilon=0.795912 Action_times=2308598 Epoche=7026\n",
      "Epsilon=0.795811 Action_times=2309885 Epoche=7027\n",
      "Epsilon=0.795751 Action_times=2310652 Epoche=7028\n",
      "Epsilon=0.795735 Action_times=2310850 Epoche=7029\n",
      "Epsilon=0.795684 Action_times=2311509 Epoche=7030\n",
      "Epsilon=0.795628 Action_times=2312210 Epoche=7031\n",
      "Epsilon=0.795512 Action_times=2313691 Epoche=7032\n",
      "Epsilon=0.795511 Action_times=2313707 Epoche=7033\n",
      "Epsilon=0.795364 Action_times=2315572 Epoche=7034\n",
      "Epsilon=0.795320 Action_times=2316138 Epoche=7035\n",
      "Epsilon=0.795218 Action_times=2317431 Epoche=7036\n",
      "Epsilon=0.795113 Action_times=2318767 Epoche=7037\n",
      "Epsilon=0.795082 Action_times=2319168 Epoche=7038\n",
      "Epsilon=0.795078 Action_times=2319213 Epoche=7039\n",
      "Epsilon=0.795041 Action_times=2319685 Epoche=7040\n",
      "Epsilon=0.794946 Action_times=2320905 Epoche=7041\n",
      "Epsilon=0.794777 Action_times=2323055 Epoche=7042\n",
      "Epsilon=0.794750 Action_times=2323392 Epoche=7043\n",
      "Epsilon=0.794654 Action_times=2324617 Epoche=7044\n",
      "Epsilon=0.794501 Action_times=2326570 Epoche=7045\n",
      "Epsilon=0.794457 Action_times=2327133 Epoche=7046\n",
      "Epsilon=0.794339 Action_times=2328634 Epoche=7047\n",
      "Epsilon=0.794299 Action_times=2329145 Epoche=7048\n",
      "Epsilon=0.794258 Action_times=2329671 Epoche=7049\n",
      "Epsilon=0.794154 Action_times=2330991 Epoche=7050\n",
      "Epsilon=0.794124 Action_times=2331376 Epoche=7051\n",
      "Epsilon=0.794093 Action_times=2331771 Epoche=7052\n",
      "Epsilon=0.794006 Action_times=2332878 Epoche=7053\n",
      "Epsilon=0.793865 Action_times=2334681 Epoche=7054\n",
      "Epsilon=0.793781 Action_times=2335751 Epoche=7055\n",
      "Epsilon=0.793758 Action_times=2336047 Epoche=7056\n",
      "Epsilon=0.793742 Action_times=2336250 Epoche=7057\n",
      "Epsilon=0.793558 Action_times=2338594 Epoche=7058\n",
      "Epsilon=0.793427 Action_times=2340267 Epoche=7059\n",
      "Epsilon=0.793242 Action_times=2342633 Epoche=7060\n",
      "Epsilon=0.793009 Action_times=2345602 Epoche=7061\n",
      "Epsilon=0.792848 Action_times=2347665 Epoche=7062\n",
      "Epsilon=0.792755 Action_times=2348852 Epoche=7063\n",
      "Epsilon=0.792737 Action_times=2349079 Epoche=7064\n",
      "Epsilon=0.792661 Action_times=2350057 Epoche=7065\n",
      "Epsilon=0.792534 Action_times=2351673 Epoche=7066\n",
      "Epsilon=0.792472 Action_times=2352471 Epoche=7067\n",
      "Epsilon=0.792389 Action_times=2353534 Epoche=7068\n",
      "Epsilon=0.792241 Action_times=2355419 Epoche=7069\n",
      "Epsilon=0.792017 Action_times=2358279 Epoche=7070\n",
      "Epsilon=0.791915 Action_times=2359583 Epoche=7071\n",
      "Epsilon=0.791774 Action_times=2361395 Epoche=7072\n",
      "Epsilon=0.791746 Action_times=2361749 Epoche=7073\n",
      "Epsilon=0.791576 Action_times=2363928 Epoche=7074\n",
      "Epsilon=0.791515 Action_times=2364700 Epoche=7075\n",
      "Epsilon=0.791446 Action_times=2365590 Epoche=7076\n",
      "Epsilon=0.791231 Action_times=2368338 Epoche=7077\n",
      "Epsilon=0.791205 Action_times=2368668 Epoche=7078\n",
      "Epsilon=0.791107 Action_times=2369927 Epoche=7079\n",
      "Epsilon=0.791027 Action_times=2370958 Epoche=7080\n",
      "Epsilon=0.790815 Action_times=2373664 Epoche=7081\n",
      "Epsilon=0.790742 Action_times=2374599 Epoche=7082\n",
      "Epsilon=0.790643 Action_times=2375875 Epoche=7083\n",
      "Epsilon=0.790480 Action_times=2377964 Epoche=7084\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.790336 Action_times=2379802 Epoche=7085\n",
      "Epsilon=0.790213 Action_times=2381378 Epoche=7086\n",
      "Epsilon=0.790146 Action_times=2382236 Epoche=7087\n",
      "Epsilon=0.790128 Action_times=2382467 Epoche=7088\n",
      "Epsilon=0.790056 Action_times=2383392 Epoche=7089\n",
      "Epsilon=0.790033 Action_times=2383683 Epoche=7090\n",
      "Epsilon=0.789984 Action_times=2384311 Epoche=7091\n",
      "Epsilon=0.789925 Action_times=2385077 Epoche=7092\n",
      "Epsilon=0.789793 Action_times=2386769 Epoche=7093\n",
      "Epsilon=0.789735 Action_times=2387514 Epoche=7094\n",
      "Epsilon=0.789651 Action_times=2388588 Epoche=7095\n",
      "Epsilon=0.789534 Action_times=2390091 Epoche=7096\n",
      "Epsilon=0.789500 Action_times=2390519 Epoche=7097\n",
      "Epsilon=0.789400 Action_times=2391804 Epoche=7098\n",
      "Epsilon=0.789269 Action_times=2393481 Epoche=7099\n",
      "Epsilon=0.789047 Action_times=2396333 Epoche=7100\n",
      "Epsilon=0.788901 Action_times=2398209 Epoche=7101\n",
      "Epsilon=0.788819 Action_times=2399264 Epoche=7102\n",
      "Epsilon=0.788686 Action_times=2400974 Epoche=7103\n",
      "Epsilon=0.788624 Action_times=2401763 Epoche=7104\n",
      "Epsilon=0.788572 Action_times=2402440 Epoche=7105\n",
      "Epsilon=0.788447 Action_times=2404044 Epoche=7106\n",
      "Epsilon=0.788371 Action_times=2405011 Epoche=7107\n",
      "Epsilon=0.788324 Action_times=2405623 Epoche=7108\n",
      "Epsilon=0.788284 Action_times=2406134 Epoche=7109\n",
      "Epsilon=0.788070 Action_times=2408879 Epoche=7110\n",
      "Epsilon=0.787909 Action_times=2410954 Epoche=7111\n",
      "Epsilon=0.787789 Action_times=2412498 Epoche=7112\n",
      "Epsilon=0.787673 Action_times=2413991 Epoche=7113\n",
      "Epsilon=0.787638 Action_times=2414440 Epoche=7114\n",
      "Epsilon=0.787523 Action_times=2415918 Epoche=7115\n",
      "Epsilon=0.787482 Action_times=2416442 Epoche=7116\n",
      "Epsilon=0.787410 Action_times=2417376 Epoche=7117\n",
      "Epsilon=0.787259 Action_times=2419316 Epoche=7118\n",
      "Epsilon=0.787227 Action_times=2419723 Epoche=7119\n",
      "Epsilon=0.787216 Action_times=2419861 Epoche=7120\n",
      "Epsilon=0.787030 Action_times=2422266 Epoche=7121\n",
      "Epsilon=0.786772 Action_times=2425583 Epoche=7122\n",
      "Epsilon=0.786629 Action_times=2427418 Epoche=7123\n",
      "Epsilon=0.786576 Action_times=2428103 Epoche=7124\n",
      "Epsilon=0.786412 Action_times=2430214 Epoche=7125\n",
      "Epsilon=0.786316 Action_times=2431452 Epoche=7126\n",
      "Epsilon=0.786201 Action_times=2432929 Epoche=7127\n",
      "Epsilon=0.786164 Action_times=2433405 Epoche=7128\n",
      "Epsilon=0.786089 Action_times=2434371 Epoche=7129\n",
      "Epsilon=0.785945 Action_times=2436228 Epoche=7130\n",
      "Epsilon=0.785908 Action_times=2436706 Epoche=7131\n",
      "Epsilon=0.785757 Action_times=2438655 Epoche=7132\n",
      "Epsilon=0.785636 Action_times=2440210 Epoche=7133\n",
      "Epsilon=0.785542 Action_times=2441428 Epoche=7134\n",
      "Epsilon=0.785420 Action_times=2443003 Epoche=7135\n",
      "Epsilon=0.785284 Action_times=2444757 Epoche=7136\n",
      "Epsilon=0.785192 Action_times=2445940 Epoche=7137\n",
      "Epsilon=0.785138 Action_times=2446639 Epoche=7138\n",
      "Epsilon=0.785049 Action_times=2447784 Epoche=7139\n",
      "Epsilon=0.784954 Action_times=2449012 Epoche=7140\n",
      "Epsilon=0.784798 Action_times=2451025 Epoche=7141\n",
      "Epsilon=0.784635 Action_times=2453128 Epoche=7142\n",
      "Epsilon=0.784484 Action_times=2455085 Epoche=7143\n",
      "Epsilon=0.784318 Action_times=2457219 Epoche=7144\n",
      "Epsilon=0.784213 Action_times=2458580 Epoche=7145\n",
      "Epsilon=0.784117 Action_times=2459819 Epoche=7146\n",
      "Epsilon=0.784071 Action_times=2460416 Epoche=7147\n",
      "Epsilon=0.783915 Action_times=2462425 Epoche=7148\n",
      "Epsilon=0.783792 Action_times=2464018 Epoche=7149\n",
      "Epsilon=0.783747 Action_times=2464597 Epoche=7150\n",
      "Epsilon=0.783673 Action_times=2465558 Epoche=7151\n",
      "Epsilon=0.783635 Action_times=2466042 Epoche=7152\n",
      "Epsilon=0.783574 Action_times=2466834 Epoche=7153\n",
      "Epsilon=0.783504 Action_times=2467742 Epoche=7154\n",
      "Epsilon=0.783449 Action_times=2468453 Epoche=7155\n",
      "Epsilon=0.783394 Action_times=2469163 Epoche=7156\n",
      "Epsilon=0.783288 Action_times=2470532 Epoche=7157\n",
      "Epsilon=0.783171 Action_times=2472045 Epoche=7158\n",
      "Epsilon=0.782928 Action_times=2475185 Epoche=7159\n",
      "Epsilon=0.782889 Action_times=2475700 Epoche=7160\n",
      "Epsilon=0.782654 Action_times=2478739 Epoche=7161\n",
      "Epsilon=0.782499 Action_times=2480738 Epoche=7162\n",
      "Epsilon=0.782486 Action_times=2480917 Epoche=7163\n",
      "Epsilon=0.782373 Action_times=2482376 Epoche=7164\n",
      "Epsilon=0.782281 Action_times=2483569 Epoche=7165\n",
      "Epsilon=0.782259 Action_times=2483853 Epoche=7166\n",
      "Epsilon=0.782199 Action_times=2484632 Epoche=7167\n",
      "Epsilon=0.782159 Action_times=2485143 Epoche=7168\n",
      "Epsilon=0.782051 Action_times=2486549 Epoche=7169\n",
      "Epsilon=0.781913 Action_times=2488336 Epoche=7170\n",
      "Epsilon=0.781894 Action_times=2488579 Epoche=7171\n",
      "Epsilon=0.781797 Action_times=2489840 Epoche=7172\n",
      "Epsilon=0.781659 Action_times=2491622 Epoche=7173\n",
      "Epsilon=0.781549 Action_times=2493044 Epoche=7174\n",
      "Epsilon=0.781405 Action_times=2494917 Epoche=7175\n",
      "Epsilon=0.781236 Action_times=2497106 Epoche=7176\n",
      "Epsilon=0.781138 Action_times=2498376 Epoche=7177\n",
      "Epsilon=0.781001 Action_times=2500155 Epoche=7178\n",
      "Epsilon=0.780989 Action_times=2500307 Epoche=7179\n",
      "Epsilon=0.780905 Action_times=2501397 Epoche=7180\n",
      "Epsilon=0.780812 Action_times=2502604 Epoche=7181\n",
      "Epsilon=0.780655 Action_times=2504640 Epoche=7182\n",
      "Epsilon=0.780458 Action_times=2507193 Epoche=7183\n",
      "Epsilon=0.780252 Action_times=2509878 Epoche=7184\n",
      "Epsilon=0.780168 Action_times=2510966 Epoche=7185\n",
      "Epsilon=0.779972 Action_times=2513514 Epoche=7186\n",
      "Epsilon=0.779754 Action_times=2516343 Epoche=7187\n",
      "Epsilon=0.779591 Action_times=2518451 Epoche=7188\n",
      "Epsilon=0.779507 Action_times=2519548 Epoche=7189\n",
      "Epsilon=0.779398 Action_times=2520969 Epoche=7190\n",
      "Epsilon=0.779325 Action_times=2521917 Epoche=7191\n",
      "Epsilon=0.779201 Action_times=2523523 Epoche=7192\n",
      "Epsilon=0.779139 Action_times=2524334 Epoche=7193\n",
      "Epsilon=0.779135 Action_times=2524387 Epoche=7194\n",
      "Epsilon=0.779085 Action_times=2525034 Epoche=7195\n",
      "Epsilon=0.778954 Action_times=2526732 Epoche=7196\n",
      "Epsilon=0.778825 Action_times=2528421 Epoche=7197\n",
      "Epsilon=0.778743 Action_times=2529487 Epoche=7198\n",
      "Epsilon=0.778635 Action_times=2530883 Epoche=7199\n",
      "Epsilon=0.778577 Action_times=2531645 Epoche=7200\n",
      "Epsilon=0.778457 Action_times=2533203 Epoche=7201\n",
      "Epsilon=0.778321 Action_times=2534968 Epoche=7202\n",
      "Epsilon=0.778158 Action_times=2537096 Epoche=7203\n",
      "Epsilon=0.777856 Action_times=2541028 Epoche=7204\n",
      "Epsilon=0.777771 Action_times=2542136 Epoche=7205\n",
      "Epsilon=0.777723 Action_times=2542762 Epoche=7206\n",
      "Epsilon=0.777688 Action_times=2543209 Epoche=7207\n",
      "Epsilon=0.777593 Action_times=2544453 Epoche=7208\n",
      "Epsilon=0.777555 Action_times=2544948 Epoche=7209\n",
      "Epsilon=0.777409 Action_times=2546849 Epoche=7210\n",
      "Epsilon=0.777320 Action_times=2548011 Epoche=7211\n",
      "Epsilon=0.777243 Action_times=2549016 Epoche=7212\n",
      "Epsilon=0.777230 Action_times=2549187 Epoche=7213\n",
      "Epsilon=0.777148 Action_times=2550258 Epoche=7214\n",
      "Epsilon=0.776990 Action_times=2552317 Epoche=7215\n",
      "Epsilon=0.776822 Action_times=2554499 Epoche=7216\n",
      "Epsilon=0.776672 Action_times=2556453 Epoche=7217\n",
      "Epsilon=0.776571 Action_times=2557773 Epoche=7218\n",
      "Epsilon=0.776568 Action_times=2557815 Epoche=7219\n",
      "Epsilon=0.776387 Action_times=2560172 Epoche=7220\n",
      "Epsilon=0.776291 Action_times=2561427 Epoche=7221\n",
      "Epsilon=0.776142 Action_times=2563375 Epoche=7222\n",
      "Epsilon=0.776115 Action_times=2563725 Epoche=7223\n",
      "Epsilon=0.776068 Action_times=2564346 Epoche=7224\n",
      "Epsilon=0.775926 Action_times=2566196 Epoche=7225\n",
      "Epsilon=0.775826 Action_times=2567506 Epoche=7226\n",
      "Epsilon=0.775661 Action_times=2569648 Epoche=7227\n",
      "Epsilon=0.775577 Action_times=2570748 Epoche=7228\n",
      "Epsilon=0.775437 Action_times=2572579 Epoche=7229\n",
      "Epsilon=0.775272 Action_times=2574733 Epoche=7230\n",
      "Epsilon=0.775202 Action_times=2575651 Epoche=7231\n",
      "Epsilon=0.775165 Action_times=2576140 Epoche=7232\n",
      "Epsilon=0.775070 Action_times=2577379 Epoche=7233\n",
      "Epsilon=0.775041 Action_times=2577752 Epoche=7234\n",
      "Epsilon=0.775005 Action_times=2578221 Epoche=7235\n",
      "Epsilon=0.774850 Action_times=2580252 Epoche=7236\n",
      "Epsilon=0.774772 Action_times=2581274 Epoche=7237\n",
      "Epsilon=0.774594 Action_times=2583596 Epoche=7238\n",
      "Epsilon=0.774444 Action_times=2585563 Epoche=7239\n",
      "Epsilon=0.774407 Action_times=2586047 Epoche=7240\n",
      "Epsilon=0.774334 Action_times=2586996 Epoche=7241\n",
      "Epsilon=0.773997 Action_times=2591410 Epoche=7242\n",
      "Epsilon=0.773973 Action_times=2591727 Epoche=7243\n",
      "Epsilon=0.773767 Action_times=2594417 Epoche=7244\n",
      "Epsilon=0.773585 Action_times=2596806 Epoche=7245\n",
      "Epsilon=0.773431 Action_times=2598817 Epoche=7246\n",
      "Epsilon=0.773370 Action_times=2599615 Epoche=7247\n",
      "Epsilon=0.773267 Action_times=2600971 Epoche=7248\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.773235 Action_times=2601385 Epoche=7249\n",
      "Epsilon=0.773143 Action_times=2602598 Epoche=7250\n",
      "Epsilon=0.773046 Action_times=2603863 Epoche=7251\n",
      "Epsilon=0.772938 Action_times=2605286 Epoche=7252\n",
      "Epsilon=0.772864 Action_times=2606250 Epoche=7253\n",
      "Epsilon=0.772847 Action_times=2606474 Epoche=7254\n",
      "Epsilon=0.772772 Action_times=2607462 Epoche=7255\n",
      "Epsilon=0.772757 Action_times=2607657 Epoche=7256\n",
      "Epsilon=0.772673 Action_times=2608754 Epoche=7257\n",
      "Epsilon=0.772504 Action_times=2610978 Epoche=7258\n",
      "Epsilon=0.772405 Action_times=2612275 Epoche=7259\n",
      "Epsilon=0.772370 Action_times=2612727 Epoche=7260\n",
      "Epsilon=0.772319 Action_times=2613399 Epoche=7261\n",
      "Epsilon=0.772115 Action_times=2616069 Epoche=7262\n",
      "Epsilon=0.771965 Action_times=2618045 Epoche=7263\n",
      "Epsilon=0.771816 Action_times=2620004 Epoche=7264\n",
      "Epsilon=0.771742 Action_times=2620967 Epoche=7265\n",
      "Epsilon=0.771699 Action_times=2621541 Epoche=7266\n",
      "Epsilon=0.771510 Action_times=2624012 Epoche=7267\n",
      "Epsilon=0.771424 Action_times=2625141 Epoche=7268\n",
      "Epsilon=0.771380 Action_times=2625720 Epoche=7269\n",
      "Epsilon=0.771352 Action_times=2626091 Epoche=7270\n",
      "Epsilon=0.771199 Action_times=2628103 Epoche=7271\n",
      "Epsilon=0.771044 Action_times=2630138 Epoche=7272\n",
      "Epsilon=0.770905 Action_times=2631965 Epoche=7273\n",
      "Epsilon=0.770803 Action_times=2633302 Epoche=7274\n",
      "Epsilon=0.770612 Action_times=2635810 Epoche=7275\n",
      "Epsilon=0.770513 Action_times=2637111 Epoche=7276\n",
      "Epsilon=0.770487 Action_times=2637456 Epoche=7277\n",
      "Epsilon=0.770447 Action_times=2637989 Epoche=7278\n",
      "Epsilon=0.770383 Action_times=2638824 Epoche=7279\n",
      "Epsilon=0.770299 Action_times=2639937 Epoche=7280\n",
      "Epsilon=0.770175 Action_times=2641565 Epoche=7281\n",
      "Epsilon=0.770153 Action_times=2641846 Epoche=7282\n",
      "Epsilon=0.770031 Action_times=2643460 Epoche=7283\n",
      "Epsilon=0.769994 Action_times=2643947 Epoche=7284\n",
      "Epsilon=0.769851 Action_times=2645825 Epoche=7285\n",
      "Epsilon=0.769759 Action_times=2647032 Epoche=7286\n",
      "Epsilon=0.769628 Action_times=2648767 Epoche=7287\n",
      "Epsilon=0.769611 Action_times=2648988 Epoche=7288\n",
      "Epsilon=0.769597 Action_times=2649167 Epoche=7289\n",
      "Epsilon=0.769517 Action_times=2650219 Epoche=7290\n",
      "Epsilon=0.769337 Action_times=2652595 Epoche=7291\n",
      "Epsilon=0.769235 Action_times=2653935 Epoche=7292\n",
      "Epsilon=0.769109 Action_times=2655591 Epoche=7293\n",
      "Epsilon=0.768936 Action_times=2657869 Epoche=7294\n",
      "Epsilon=0.768929 Action_times=2657963 Epoche=7295\n",
      "Epsilon=0.768810 Action_times=2659541 Epoche=7296\n",
      "Epsilon=0.768737 Action_times=2660503 Epoche=7297\n",
      "Epsilon=0.768665 Action_times=2661441 Epoche=7298\n",
      "Epsilon=0.768661 Action_times=2661503 Epoche=7299\n",
      "Epsilon=0.768592 Action_times=2662409 Epoche=7300\n",
      "Epsilon=0.768499 Action_times=2663640 Epoche=7301\n",
      "Epsilon=0.768282 Action_times=2666490 Epoche=7302\n",
      "Epsilon=0.768280 Action_times=2666525 Epoche=7303\n",
      "Epsilon=0.768201 Action_times=2667565 Epoche=7304\n",
      "Epsilon=0.768099 Action_times=2668914 Epoche=7305\n",
      "Epsilon=0.768001 Action_times=2670207 Epoche=7306\n",
      "Epsilon=0.767839 Action_times=2672344 Epoche=7307\n",
      "Epsilon=0.767671 Action_times=2674556 Epoche=7308\n",
      "Epsilon=0.767508 Action_times=2676713 Epoche=7309\n",
      "Epsilon=0.767483 Action_times=2677038 Epoche=7310\n",
      "Epsilon=0.767377 Action_times=2678443 Epoche=7311\n",
      "Epsilon=0.767229 Action_times=2680397 Epoche=7312\n",
      "Epsilon=0.767074 Action_times=2682446 Epoche=7313\n",
      "Epsilon=0.766947 Action_times=2684117 Epoche=7314\n",
      "Epsilon=0.766944 Action_times=2684161 Epoche=7315\n",
      "Epsilon=0.766811 Action_times=2685908 Epoche=7316\n",
      "Epsilon=0.766727 Action_times=2687030 Epoche=7317\n",
      "Epsilon=0.766607 Action_times=2688616 Epoche=7318\n",
      "Epsilon=0.766480 Action_times=2690286 Epoche=7319\n",
      "Epsilon=0.766305 Action_times=2692608 Epoche=7320\n",
      "Epsilon=0.766271 Action_times=2693046 Epoche=7321\n",
      "Epsilon=0.766171 Action_times=2694373 Epoche=7322\n",
      "Epsilon=0.765944 Action_times=2697383 Epoche=7323\n",
      "Epsilon=0.765809 Action_times=2699160 Epoche=7324\n",
      "Epsilon=0.765668 Action_times=2701034 Epoche=7325\n",
      "Epsilon=0.765561 Action_times=2702438 Epoche=7326\n",
      "Epsilon=0.765501 Action_times=2703235 Epoche=7327\n",
      "Epsilon=0.765414 Action_times=2704384 Epoche=7328\n",
      "Epsilon=0.765266 Action_times=2706349 Epoche=7329\n",
      "Epsilon=0.765091 Action_times=2708668 Epoche=7330\n",
      "Epsilon=0.765026 Action_times=2709529 Epoche=7331\n",
      "Epsilon=0.764977 Action_times=2710180 Epoche=7332\n",
      "Epsilon=0.764957 Action_times=2710439 Epoche=7333\n",
      "Epsilon=0.764850 Action_times=2711864 Epoche=7334\n",
      "Epsilon=0.764805 Action_times=2712451 Epoche=7335\n",
      "Epsilon=0.764778 Action_times=2712809 Epoche=7336\n",
      "Epsilon=0.764687 Action_times=2714012 Epoche=7337\n",
      "Epsilon=0.764618 Action_times=2714935 Epoche=7338\n",
      "Epsilon=0.764518 Action_times=2716260 Epoche=7339\n",
      "Epsilon=0.764407 Action_times=2717735 Epoche=7340\n",
      "Epsilon=0.764331 Action_times=2718733 Epoche=7341\n",
      "Epsilon=0.764228 Action_times=2720106 Epoche=7342\n",
      "Epsilon=0.764065 Action_times=2722268 Epoche=7343\n",
      "Epsilon=0.763875 Action_times=2724788 Epoche=7344\n",
      "Epsilon=0.763803 Action_times=2725737 Epoche=7345\n",
      "Epsilon=0.763731 Action_times=2726698 Epoche=7346\n",
      "Epsilon=0.763632 Action_times=2728008 Epoche=7347\n",
      "Epsilon=0.763532 Action_times=2729340 Epoche=7348\n",
      "Epsilon=0.763347 Action_times=2731796 Epoche=7349\n",
      "Epsilon=0.763164 Action_times=2734215 Epoche=7350\n",
      "Epsilon=0.763067 Action_times=2735506 Epoche=7351\n",
      "Epsilon=0.763051 Action_times=2735722 Epoche=7352\n",
      "Epsilon=0.762814 Action_times=2738871 Epoche=7353\n",
      "Epsilon=0.762731 Action_times=2739966 Epoche=7354\n",
      "Epsilon=0.762548 Action_times=2742398 Epoche=7355\n",
      "Epsilon=0.762453 Action_times=2743662 Epoche=7356\n",
      "Epsilon=0.762342 Action_times=2745138 Epoche=7357\n",
      "Epsilon=0.762239 Action_times=2746508 Epoche=7358\n",
      "Epsilon=0.762032 Action_times=2749259 Epoche=7359\n",
      "Epsilon=0.761907 Action_times=2750929 Epoche=7360\n",
      "Epsilon=0.761791 Action_times=2752467 Epoche=7361\n",
      "Epsilon=0.761592 Action_times=2755109 Epoche=7362\n",
      "Epsilon=0.761544 Action_times=2755754 Epoche=7363\n",
      "Epsilon=0.761496 Action_times=2756394 Epoche=7364\n",
      "Epsilon=0.761356 Action_times=2758253 Epoche=7365\n",
      "Epsilon=0.761248 Action_times=2759694 Epoche=7366\n",
      "Epsilon=0.761127 Action_times=2761302 Epoche=7367\n",
      "Epsilon=0.761110 Action_times=2761525 Epoche=7368\n",
      "Epsilon=0.761036 Action_times=2762511 Epoche=7369\n",
      "Epsilon=0.760968 Action_times=2763421 Epoche=7370\n",
      "Epsilon=0.760804 Action_times=2765605 Epoche=7371\n",
      "Epsilon=0.760689 Action_times=2767134 Epoche=7372\n",
      "Epsilon=0.760652 Action_times=2767622 Epoche=7373\n",
      "Epsilon=0.760299 Action_times=2772336 Epoche=7374\n",
      "Epsilon=0.760133 Action_times=2774539 Epoche=7375\n",
      "Epsilon=0.760056 Action_times=2775568 Epoche=7376\n",
      "Epsilon=0.760006 Action_times=2776242 Epoche=7377\n",
      "Epsilon=0.759842 Action_times=2778423 Epoche=7378\n",
      "Epsilon=0.759801 Action_times=2778977 Epoche=7379\n",
      "Epsilon=0.759765 Action_times=2779457 Epoche=7380\n",
      "Epsilon=0.759671 Action_times=2780700 Epoche=7381\n",
      "Epsilon=0.759480 Action_times=2783249 Epoche=7382\n",
      "Epsilon=0.759359 Action_times=2784869 Epoche=7383\n",
      "Epsilon=0.759277 Action_times=2785966 Epoche=7384\n",
      "Epsilon=0.759068 Action_times=2788746 Epoche=7385\n",
      "Epsilon=0.759051 Action_times=2788979 Epoche=7386\n",
      "Epsilon=0.758902 Action_times=2790969 Epoche=7387\n",
      "Epsilon=0.758837 Action_times=2791833 Epoche=7388\n",
      "Epsilon=0.758795 Action_times=2792394 Epoche=7389\n",
      "Epsilon=0.758750 Action_times=2792996 Epoche=7390\n",
      "Epsilon=0.758702 Action_times=2793633 Epoche=7391\n",
      "Epsilon=0.758546 Action_times=2795727 Epoche=7392\n",
      "Epsilon=0.758416 Action_times=2797465 Epoche=7393\n",
      "Epsilon=0.758373 Action_times=2798033 Epoche=7394\n",
      "Epsilon=0.758301 Action_times=2799003 Epoche=7395\n",
      "Epsilon=0.758180 Action_times=2800609 Epoche=7396\n",
      "Epsilon=0.758084 Action_times=2801900 Epoche=7397\n",
      "Epsilon=0.758053 Action_times=2802313 Epoche=7398\n",
      "Epsilon=0.757917 Action_times=2804123 Epoche=7399\n",
      "Epsilon=0.757805 Action_times=2805630 Epoche=7400\n",
      "Epsilon=0.757767 Action_times=2806140 Epoche=7401\n",
      "Epsilon=0.757655 Action_times=2807638 Epoche=7402\n",
      "Epsilon=0.757577 Action_times=2808682 Epoche=7403\n",
      "Epsilon=0.757461 Action_times=2810227 Epoche=7404\n",
      "Epsilon=0.757298 Action_times=2812404 Epoche=7405\n",
      "Epsilon=0.757211 Action_times=2813571 Epoche=7406\n",
      "Epsilon=0.757090 Action_times=2815188 Epoche=7407\n",
      "Epsilon=0.757039 Action_times=2815874 Epoche=7408\n",
      "Epsilon=0.756943 Action_times=2817159 Epoche=7409\n",
      "Epsilon=0.756855 Action_times=2818337 Epoche=7410\n",
      "Epsilon=0.756648 Action_times=2821117 Epoche=7411\n",
      "Epsilon=0.756524 Action_times=2822777 Epoche=7412\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.756472 Action_times=2823468 Epoche=7413\n",
      "Epsilon=0.756444 Action_times=2823849 Epoche=7414\n",
      "Epsilon=0.756435 Action_times=2823967 Epoche=7415\n",
      "Epsilon=0.756350 Action_times=2825104 Epoche=7416\n",
      "Epsilon=0.756254 Action_times=2826391 Epoche=7417\n",
      "Epsilon=0.756191 Action_times=2827232 Epoche=7418\n",
      "Epsilon=0.756153 Action_times=2827737 Epoche=7419\n",
      "Epsilon=0.756121 Action_times=2828176 Epoche=7420\n",
      "Epsilon=0.756083 Action_times=2828678 Epoche=7421\n",
      "Epsilon=0.756010 Action_times=2829659 Epoche=7422\n",
      "Epsilon=0.755957 Action_times=2830374 Epoche=7423\n",
      "Epsilon=0.755841 Action_times=2831929 Epoche=7424\n",
      "Epsilon=0.755797 Action_times=2832515 Epoche=7425\n",
      "Epsilon=0.755721 Action_times=2833538 Epoche=7426\n",
      "Epsilon=0.755665 Action_times=2834280 Epoche=7427\n",
      "Epsilon=0.755453 Action_times=2837127 Epoche=7428\n",
      "Epsilon=0.755418 Action_times=2837602 Epoche=7429\n",
      "Epsilon=0.755337 Action_times=2838682 Epoche=7430\n",
      "Epsilon=0.755271 Action_times=2839567 Epoche=7431\n",
      "Epsilon=0.755183 Action_times=2840746 Epoche=7432\n",
      "Epsilon=0.755065 Action_times=2842334 Epoche=7433\n",
      "Epsilon=0.754960 Action_times=2843745 Epoche=7434\n",
      "Epsilon=0.754838 Action_times=2845385 Epoche=7435\n",
      "Epsilon=0.754769 Action_times=2846308 Epoche=7436\n",
      "Epsilon=0.754758 Action_times=2846458 Epoche=7437\n",
      "Epsilon=0.754724 Action_times=2846909 Epoche=7438\n",
      "Epsilon=0.754702 Action_times=2847203 Epoche=7439\n",
      "Epsilon=0.754558 Action_times=2849136 Epoche=7440\n",
      "Epsilon=0.754470 Action_times=2850321 Epoche=7441\n",
      "Epsilon=0.754310 Action_times=2852470 Epoche=7442\n",
      "Epsilon=0.754246 Action_times=2853336 Epoche=7443\n",
      "Epsilon=0.754175 Action_times=2854284 Epoche=7444\n",
      "Epsilon=0.754120 Action_times=2855023 Epoche=7445\n",
      "Epsilon=0.754062 Action_times=2855803 Epoche=7446\n",
      "Epsilon=0.753976 Action_times=2856957 Epoche=7447\n",
      "Epsilon=0.753937 Action_times=2857491 Epoche=7448\n",
      "Epsilon=0.753873 Action_times=2858343 Epoche=7449\n",
      "Epsilon=0.753842 Action_times=2858764 Epoche=7450\n",
      "Epsilon=0.753733 Action_times=2860230 Epoche=7451\n",
      "Epsilon=0.753567 Action_times=2862460 Epoche=7452\n",
      "Epsilon=0.753384 Action_times=2864927 Epoche=7453\n",
      "Epsilon=0.753203 Action_times=2867359 Epoche=7454\n",
      "Epsilon=0.753155 Action_times=2868004 Epoche=7455\n",
      "Epsilon=0.753028 Action_times=2869708 Epoche=7456\n",
      "Epsilon=0.752989 Action_times=2870243 Epoche=7457\n",
      "Epsilon=0.752883 Action_times=2871667 Epoche=7458\n",
      "Epsilon=0.752869 Action_times=2871848 Epoche=7459\n",
      "Epsilon=0.752678 Action_times=2874425 Epoche=7460\n",
      "Epsilon=0.752520 Action_times=2876552 Epoche=7461\n",
      "Epsilon=0.752473 Action_times=2877182 Epoche=7462\n",
      "Epsilon=0.752347 Action_times=2878884 Epoche=7463\n",
      "Epsilon=0.752070 Action_times=2882613 Epoche=7464\n",
      "Epsilon=0.751852 Action_times=2885548 Epoche=7465\n",
      "Epsilon=0.751757 Action_times=2886832 Epoche=7466\n",
      "Epsilon=0.751718 Action_times=2887352 Epoche=7467\n",
      "Epsilon=0.751671 Action_times=2887994 Epoche=7468\n",
      "Epsilon=0.751501 Action_times=2890285 Epoche=7469\n",
      "Epsilon=0.751361 Action_times=2892168 Epoche=7470\n",
      "Epsilon=0.751297 Action_times=2893035 Epoche=7471\n",
      "Epsilon=0.751231 Action_times=2893928 Epoche=7472\n",
      "Epsilon=0.751155 Action_times=2894953 Epoche=7473\n",
      "Epsilon=0.750990 Action_times=2897183 Epoche=7474\n",
      "Epsilon=0.750862 Action_times=2898904 Epoche=7475\n",
      "Epsilon=0.750714 Action_times=2900899 Epoche=7476\n",
      "Epsilon=0.750511 Action_times=2903643 Epoche=7477\n",
      "Epsilon=0.750403 Action_times=2905105 Epoche=7478\n",
      "Epsilon=0.750348 Action_times=2905850 Epoche=7479\n",
      "Epsilon=0.750187 Action_times=2908024 Epoche=7480\n",
      "Epsilon=0.750020 Action_times=2910281 Epoche=7481\n",
      "Epsilon=0.749918 Action_times=2911662 Epoche=7482\n",
      "Epsilon=0.749751 Action_times=2913911 Epoche=7483\n",
      "Epsilon=0.749673 Action_times=2914965 Epoche=7484\n",
      "Epsilon=0.749591 Action_times=2916070 Epoche=7485\n",
      "Epsilon=0.749446 Action_times=2918040 Epoche=7486\n",
      "Epsilon=0.749423 Action_times=2918346 Epoche=7487\n",
      "Epsilon=0.749358 Action_times=2919231 Epoche=7488\n",
      "Epsilon=0.749291 Action_times=2920129 Epoche=7489\n",
      "Epsilon=0.749184 Action_times=2921581 Epoche=7490\n",
      "Epsilon=0.749099 Action_times=2922726 Epoche=7491\n",
      "Epsilon=0.748955 Action_times=2924674 Epoche=7492\n",
      "Epsilon=0.748776 Action_times=2927105 Epoche=7493\n",
      "Epsilon=0.748587 Action_times=2929665 Epoche=7494\n",
      "Epsilon=0.748483 Action_times=2931070 Epoche=7495\n",
      "Epsilon=0.748441 Action_times=2931642 Epoche=7496\n",
      "Epsilon=0.748399 Action_times=2932209 Epoche=7497\n",
      "Epsilon=0.748178 Action_times=2935193 Epoche=7498\n",
      "Epsilon=0.748008 Action_times=2937505 Epoche=7499\n",
      "Epsilon=0.747985 Action_times=2937811 Epoche=7500\n",
      "Epsilon=0.747931 Action_times=2938541 Epoche=7501\n",
      "Epsilon=0.747888 Action_times=2939135 Epoche=7502\n",
      "Epsilon=0.747817 Action_times=2940085 Epoche=7503\n",
      "Epsilon=0.747782 Action_times=2940570 Epoche=7504\n",
      "Epsilon=0.747739 Action_times=2941148 Epoche=7505\n",
      "Epsilon=0.747679 Action_times=2941960 Epoche=7506\n",
      "Epsilon=0.747516 Action_times=2944178 Epoche=7507\n",
      "Epsilon=0.747457 Action_times=2944966 Epoche=7508\n",
      "Epsilon=0.747352 Action_times=2946391 Epoche=7509\n",
      "Epsilon=0.747087 Action_times=2949987 Epoche=7510\n",
      "Epsilon=0.746957 Action_times=2951754 Epoche=7511\n",
      "Epsilon=0.746929 Action_times=2952133 Epoche=7512\n",
      "Epsilon=0.746715 Action_times=2955038 Epoche=7513\n",
      "Epsilon=0.746576 Action_times=2956931 Epoche=7514\n",
      "Epsilon=0.746515 Action_times=2957759 Epoche=7515\n",
      "Epsilon=0.746270 Action_times=2961078 Epoche=7516\n",
      "Epsilon=0.746204 Action_times=2961976 Epoche=7517\n",
      "Epsilon=0.746082 Action_times=2963635 Epoche=7518\n",
      "Epsilon=0.745971 Action_times=2965141 Epoche=7519\n",
      "Epsilon=0.745942 Action_times=2965542 Epoche=7520\n",
      "Epsilon=0.745836 Action_times=2966972 Epoche=7521\n",
      "Epsilon=0.745774 Action_times=2967820 Epoche=7522\n",
      "Epsilon=0.745733 Action_times=2968377 Epoche=7523\n",
      "Epsilon=0.745662 Action_times=2969339 Epoche=7524\n",
      "Epsilon=0.745566 Action_times=2970642 Epoche=7525\n",
      "Epsilon=0.745418 Action_times=2972656 Epoche=7526\n",
      "Epsilon=0.745348 Action_times=2973610 Epoche=7527\n",
      "Epsilon=0.745214 Action_times=2975434 Epoche=7528\n",
      "Epsilon=0.745084 Action_times=2977195 Epoche=7529\n",
      "Epsilon=0.745010 Action_times=2978215 Epoche=7530\n",
      "Epsilon=0.744923 Action_times=2979393 Epoche=7531\n",
      "Epsilon=0.744802 Action_times=2981040 Epoche=7532\n",
      "Epsilon=0.744792 Action_times=2981176 Epoche=7533\n",
      "Epsilon=0.744702 Action_times=2982399 Epoche=7534\n",
      "Epsilon=0.744636 Action_times=2983296 Epoche=7535\n",
      "Epsilon=0.744445 Action_times=2985895 Epoche=7536\n",
      "Epsilon=0.744391 Action_times=2986630 Epoche=7537\n",
      "Epsilon=0.744356 Action_times=2987104 Epoche=7538\n",
      "Epsilon=0.744325 Action_times=2987531 Epoche=7539\n",
      "Epsilon=0.744238 Action_times=2988713 Epoche=7540\n",
      "Epsilon=0.744172 Action_times=2989618 Epoche=7541\n",
      "Epsilon=0.744040 Action_times=2991411 Epoche=7542\n",
      "Epsilon=0.744005 Action_times=2991892 Epoche=7543\n",
      "Epsilon=0.743866 Action_times=2993781 Epoche=7544\n",
      "Epsilon=0.743847 Action_times=2994049 Epoche=7545\n",
      "Epsilon=0.743807 Action_times=2994592 Epoche=7546\n",
      "Epsilon=0.743773 Action_times=2995059 Epoche=7547\n",
      "Epsilon=0.743744 Action_times=2995451 Epoche=7548\n",
      "Epsilon=0.743688 Action_times=2996215 Epoche=7549\n",
      "Epsilon=0.743579 Action_times=2997701 Epoche=7550\n",
      "Epsilon=0.743524 Action_times=2998444 Epoche=7551\n",
      "Epsilon=0.743466 Action_times=2999236 Epoche=7552\n",
      "Epsilon=0.743369 Action_times=3000561 Epoche=7553\n",
      "Epsilon=0.743200 Action_times=3002864 Epoche=7554\n",
      "Epsilon=0.743063 Action_times=3004731 Epoche=7555\n",
      "Epsilon=0.743029 Action_times=3005196 Epoche=7556\n",
      "Epsilon=0.742867 Action_times=3007401 Epoche=7557\n",
      "Epsilon=0.742501 Action_times=3012397 Epoche=7558\n",
      "Epsilon=0.742394 Action_times=3013867 Epoche=7559\n",
      "Epsilon=0.742279 Action_times=3015434 Epoche=7560\n",
      "Epsilon=0.742201 Action_times=3016499 Epoche=7561\n",
      "Epsilon=0.742122 Action_times=3017577 Epoche=7562\n",
      "Epsilon=0.741988 Action_times=3019403 Epoche=7563\n",
      "Epsilon=0.741925 Action_times=3020275 Epoche=7564\n",
      "Epsilon=0.741821 Action_times=3021694 Epoche=7565\n",
      "Epsilon=0.741698 Action_times=3023364 Epoche=7566\n",
      "Epsilon=0.741477 Action_times=3026392 Epoche=7567\n",
      "Epsilon=0.741451 Action_times=3026751 Epoche=7568\n",
      "Epsilon=0.741350 Action_times=3028131 Epoche=7569\n",
      "Epsilon=0.741170 Action_times=3030588 Epoche=7570\n",
      "Epsilon=0.741040 Action_times=3032371 Epoche=7571\n",
      "Epsilon=0.740990 Action_times=3033051 Epoche=7572\n",
      "Epsilon=0.740918 Action_times=3034036 Epoche=7573\n",
      "Epsilon=0.740826 Action_times=3035290 Epoche=7574\n",
      "Epsilon=0.740781 Action_times=3035914 Epoche=7575\n",
      "Epsilon=0.740720 Action_times=3036746 Epoche=7576\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.740606 Action_times=3038309 Epoche=7577\n",
      "Epsilon=0.740542 Action_times=3039187 Epoche=7578\n",
      "Epsilon=0.740442 Action_times=3040557 Epoche=7579\n",
      "Epsilon=0.740409 Action_times=3040998 Epoche=7580\n",
      "Epsilon=0.740306 Action_times=3042417 Epoche=7581\n",
      "Epsilon=0.740270 Action_times=3042904 Epoche=7582\n",
      "Epsilon=0.740255 Action_times=3043112 Epoche=7583\n",
      "Epsilon=0.740181 Action_times=3044130 Epoche=7584\n",
      "Epsilon=0.740135 Action_times=3044752 Epoche=7585\n",
      "Epsilon=0.740046 Action_times=3045976 Epoche=7586\n",
      "Epsilon=0.740021 Action_times=3046314 Epoche=7587\n",
      "Epsilon=0.739939 Action_times=3047434 Epoche=7588\n",
      "Epsilon=0.739687 Action_times=3050886 Epoche=7589\n",
      "Epsilon=0.739609 Action_times=3051962 Epoche=7590\n",
      "Epsilon=0.739579 Action_times=3052377 Epoche=7591\n",
      "Epsilon=0.739527 Action_times=3053090 Epoche=7592\n",
      "Epsilon=0.739478 Action_times=3053754 Epoche=7593\n",
      "Epsilon=0.739193 Action_times=3057661 Epoche=7594\n",
      "Epsilon=0.738953 Action_times=3060954 Epoche=7595\n",
      "Epsilon=0.738773 Action_times=3063433 Epoche=7596\n",
      "Epsilon=0.738719 Action_times=3064171 Epoche=7597\n",
      "Epsilon=0.738579 Action_times=3066095 Epoche=7598\n",
      "Epsilon=0.738430 Action_times=3068138 Epoche=7599\n",
      "Epsilon=0.738369 Action_times=3068965 Epoche=7600\n",
      "Epsilon=0.738294 Action_times=3069996 Epoche=7601\n",
      "Epsilon=0.738211 Action_times=3071137 Epoche=7602\n",
      "Epsilon=0.738046 Action_times=3073409 Epoche=7603\n",
      "Epsilon=0.737909 Action_times=3075290 Epoche=7604\n",
      "Epsilon=0.737866 Action_times=3075873 Epoche=7605\n",
      "Epsilon=0.737823 Action_times=3076470 Epoche=7606\n",
      "Epsilon=0.737792 Action_times=3076896 Epoche=7607\n",
      "Epsilon=0.737719 Action_times=3077895 Epoche=7608\n",
      "Epsilon=0.737584 Action_times=3079756 Epoche=7609\n",
      "Epsilon=0.737539 Action_times=3080379 Epoche=7610\n",
      "Epsilon=0.737377 Action_times=3082594 Epoche=7611\n",
      "Epsilon=0.737267 Action_times=3084110 Epoche=7612\n",
      "Epsilon=0.736911 Action_times=3089011 Epoche=7613\n",
      "Epsilon=0.736704 Action_times=3091851 Epoche=7614\n",
      "Epsilon=0.736684 Action_times=3092135 Epoche=7615\n",
      "Epsilon=0.736607 Action_times=3093190 Epoche=7616\n",
      "Epsilon=0.736595 Action_times=3093355 Epoche=7617\n",
      "Epsilon=0.736505 Action_times=3094596 Epoche=7618\n",
      "Epsilon=0.736394 Action_times=3096127 Epoche=7619\n",
      "Epsilon=0.736227 Action_times=3098428 Epoche=7620\n",
      "Epsilon=0.736199 Action_times=3098804 Epoche=7621\n",
      "Epsilon=0.736169 Action_times=3099223 Epoche=7622\n",
      "Epsilon=0.736063 Action_times=3100678 Epoche=7623\n",
      "Epsilon=0.735989 Action_times=3101701 Epoche=7624\n",
      "Epsilon=0.735965 Action_times=3102038 Epoche=7625\n",
      "Epsilon=0.735909 Action_times=3102804 Epoche=7626\n",
      "Epsilon=0.735881 Action_times=3103187 Epoche=7627\n",
      "Epsilon=0.735843 Action_times=3103715 Epoche=7628\n",
      "Epsilon=0.735787 Action_times=3104487 Epoche=7629\n",
      "Epsilon=0.735757 Action_times=3104894 Epoche=7630\n",
      "Epsilon=0.735463 Action_times=3108948 Epoche=7631\n",
      "Epsilon=0.735361 Action_times=3110361 Epoche=7632\n",
      "Epsilon=0.735274 Action_times=3111561 Epoche=7633\n",
      "Epsilon=0.735265 Action_times=3111681 Epoche=7634\n",
      "Epsilon=0.735230 Action_times=3112159 Epoche=7635\n",
      "Epsilon=0.735122 Action_times=3113653 Epoche=7636\n",
      "Epsilon=0.734948 Action_times=3116056 Epoche=7637\n",
      "Epsilon=0.734832 Action_times=3117652 Epoche=7638\n",
      "Epsilon=0.734800 Action_times=3118098 Epoche=7639\n",
      "Epsilon=0.734614 Action_times=3120652 Epoche=7640\n",
      "Epsilon=0.734566 Action_times=3121318 Epoche=7641\n",
      "Epsilon=0.734495 Action_times=3122307 Epoche=7642\n",
      "Epsilon=0.734467 Action_times=3122694 Epoche=7643\n",
      "Epsilon=0.734192 Action_times=3126481 Epoche=7644\n",
      "Epsilon=0.734026 Action_times=3128778 Epoche=7645\n",
      "Epsilon=0.733980 Action_times=3129413 Epoche=7646\n",
      "Epsilon=0.733932 Action_times=3130071 Epoche=7647\n",
      "Epsilon=0.733880 Action_times=3130787 Epoche=7648\n",
      "Epsilon=0.733847 Action_times=3131245 Epoche=7649\n",
      "Epsilon=0.733830 Action_times=3131480 Epoche=7650\n",
      "Epsilon=0.733733 Action_times=3132822 Epoche=7651\n",
      "Epsilon=0.733659 Action_times=3133852 Epoche=7652\n",
      "Epsilon=0.733644 Action_times=3134049 Epoche=7653\n",
      "Epsilon=0.733580 Action_times=3134937 Epoche=7654\n",
      "Epsilon=0.733556 Action_times=3135276 Epoche=7655\n",
      "Epsilon=0.733491 Action_times=3136165 Epoche=7656\n",
      "Epsilon=0.733373 Action_times=3137806 Epoche=7657\n",
      "Epsilon=0.733300 Action_times=3138815 Epoche=7658\n",
      "Epsilon=0.733244 Action_times=3139587 Epoche=7659\n",
      "Epsilon=0.733170 Action_times=3140604 Epoche=7660\n",
      "Epsilon=0.733157 Action_times=3140787 Epoche=7661\n",
      "Epsilon=0.733108 Action_times=3141460 Epoche=7662\n",
      "Epsilon=0.732985 Action_times=3143167 Epoche=7663\n",
      "Epsilon=0.732801 Action_times=3145712 Epoche=7664\n",
      "Epsilon=0.732720 Action_times=3146833 Epoche=7665\n",
      "Epsilon=0.732599 Action_times=3148505 Epoche=7666\n",
      "Epsilon=0.732581 Action_times=3148754 Epoche=7667\n",
      "Epsilon=0.732541 Action_times=3149308 Epoche=7668\n",
      "Epsilon=0.732380 Action_times=3151532 Epoche=7669\n",
      "Epsilon=0.732313 Action_times=3152469 Epoche=7670\n",
      "Epsilon=0.732204 Action_times=3153970 Epoche=7671\n",
      "Epsilon=0.732147 Action_times=3154756 Epoche=7672\n",
      "Epsilon=0.732033 Action_times=3156347 Epoche=7673\n",
      "Epsilon=0.731871 Action_times=3158589 Epoche=7674\n",
      "Epsilon=0.731769 Action_times=3160001 Epoche=7675\n",
      "Epsilon=0.731727 Action_times=3160574 Epoche=7676\n",
      "Epsilon=0.731634 Action_times=3161863 Epoche=7677\n",
      "Epsilon=0.731569 Action_times=3162772 Epoche=7678\n",
      "Epsilon=0.731490 Action_times=3163868 Epoche=7679\n",
      "Epsilon=0.731402 Action_times=3165078 Epoche=7680\n",
      "Epsilon=0.731334 Action_times=3166023 Epoche=7681\n",
      "Epsilon=0.731106 Action_times=3169189 Epoche=7682\n",
      "Epsilon=0.730948 Action_times=3171383 Epoche=7683\n",
      "Epsilon=0.730839 Action_times=3172891 Epoche=7684\n",
      "Epsilon=0.730807 Action_times=3173337 Epoche=7685\n",
      "Epsilon=0.730747 Action_times=3174170 Epoche=7686\n",
      "Epsilon=0.730701 Action_times=3174799 Epoche=7687\n",
      "Epsilon=0.730581 Action_times=3176477 Epoche=7688\n",
      "Epsilon=0.730522 Action_times=3177295 Epoche=7689\n",
      "Epsilon=0.730471 Action_times=3177994 Epoche=7690\n",
      "Epsilon=0.730254 Action_times=3181007 Epoche=7691\n",
      "Epsilon=0.730167 Action_times=3182217 Epoche=7692\n",
      "Epsilon=0.730068 Action_times=3183599 Epoche=7693\n",
      "Epsilon=0.729998 Action_times=3184564 Epoche=7694\n",
      "Epsilon=0.729947 Action_times=3185272 Epoche=7695\n",
      "Epsilon=0.729890 Action_times=3186066 Epoche=7696\n",
      "Epsilon=0.729852 Action_times=3186596 Epoche=7697\n",
      "Epsilon=0.729771 Action_times=3187718 Epoche=7698\n",
      "Epsilon=0.729750 Action_times=3188014 Epoche=7699\n",
      "Epsilon=0.729721 Action_times=3188416 Epoche=7700\n",
      "Epsilon=0.729674 Action_times=3189064 Epoche=7701\n",
      "Epsilon=0.729570 Action_times=3190515 Epoche=7702\n",
      "Epsilon=0.729556 Action_times=3190704 Epoche=7703\n",
      "Epsilon=0.729521 Action_times=3191195 Epoche=7704\n",
      "Epsilon=0.729413 Action_times=3192691 Epoche=7705\n",
      "Epsilon=0.729255 Action_times=3194895 Epoche=7706\n",
      "Epsilon=0.729188 Action_times=3195828 Epoche=7707\n",
      "Epsilon=0.729139 Action_times=3196501 Epoche=7708\n",
      "Epsilon=0.729082 Action_times=3197290 Epoche=7709\n",
      "Epsilon=0.728960 Action_times=3198988 Epoche=7710\n",
      "Epsilon=0.728796 Action_times=3201272 Epoche=7711\n",
      "Epsilon=0.728660 Action_times=3203172 Epoche=7712\n",
      "Epsilon=0.728617 Action_times=3203764 Epoche=7713\n",
      "Epsilon=0.728454 Action_times=3206033 Epoche=7714\n",
      "Epsilon=0.728266 Action_times=3208656 Epoche=7715\n",
      "Epsilon=0.728176 Action_times=3209907 Epoche=7716\n",
      "Epsilon=0.728004 Action_times=3212300 Epoche=7717\n",
      "Epsilon=0.727933 Action_times=3213284 Epoche=7718\n",
      "Epsilon=0.727896 Action_times=3213809 Epoche=7719\n",
      "Epsilon=0.727796 Action_times=3215200 Epoche=7720\n",
      "Epsilon=0.727758 Action_times=3215719 Epoche=7721\n",
      "Epsilon=0.727675 Action_times=3216883 Epoche=7722\n",
      "Epsilon=0.727578 Action_times=3218228 Epoche=7723\n",
      "Epsilon=0.727510 Action_times=3219181 Epoche=7724\n",
      "Epsilon=0.727477 Action_times=3219642 Epoche=7725\n",
      "Epsilon=0.727366 Action_times=3221183 Epoche=7726\n",
      "Epsilon=0.727161 Action_times=3224050 Epoche=7727\n",
      "Epsilon=0.726996 Action_times=3226347 Epoche=7728\n",
      "Epsilon=0.726875 Action_times=3228037 Epoche=7729\n",
      "Epsilon=0.726800 Action_times=3229083 Epoche=7730\n",
      "Epsilon=0.726712 Action_times=3230315 Epoche=7731\n",
      "Epsilon=0.726684 Action_times=3230699 Epoche=7732\n",
      "Epsilon=0.726606 Action_times=3231784 Epoche=7733\n",
      "Epsilon=0.726532 Action_times=3232822 Epoche=7734\n",
      "Epsilon=0.726477 Action_times=3233590 Epoche=7735\n",
      "Epsilon=0.726430 Action_times=3234250 Epoche=7736\n",
      "Epsilon=0.726297 Action_times=3236104 Epoche=7737\n",
      "Epsilon=0.726205 Action_times=3237382 Epoche=7738\n",
      "Epsilon=0.726171 Action_times=3237860 Epoche=7739\n",
      "Epsilon=0.726104 Action_times=3238802 Epoche=7740\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.726061 Action_times=3239393 Epoche=7741\n",
      "Epsilon=0.725960 Action_times=3240804 Epoche=7742\n",
      "Epsilon=0.725950 Action_times=3240944 Epoche=7743\n",
      "Epsilon=0.725929 Action_times=3241242 Epoche=7744\n",
      "Epsilon=0.725802 Action_times=3243010 Epoche=7745\n",
      "Epsilon=0.725635 Action_times=3245348 Epoche=7746\n",
      "Epsilon=0.725513 Action_times=3247056 Epoche=7747\n",
      "Epsilon=0.725457 Action_times=3247837 Epoche=7748\n",
      "Epsilon=0.725361 Action_times=3249172 Epoche=7749\n",
      "Epsilon=0.725248 Action_times=3250763 Epoche=7750\n",
      "Epsilon=0.725094 Action_times=3252915 Epoche=7751\n",
      "Epsilon=0.725009 Action_times=3254095 Epoche=7752\n",
      "Epsilon=0.724887 Action_times=3255800 Epoche=7753\n",
      "Epsilon=0.724829 Action_times=3256622 Epoche=7754\n",
      "Epsilon=0.724800 Action_times=3257027 Epoche=7755\n",
      "Epsilon=0.724700 Action_times=3258421 Epoche=7756\n",
      "Epsilon=0.724625 Action_times=3259465 Epoche=7757\n",
      "Epsilon=0.724566 Action_times=3260290 Epoche=7758\n",
      "Epsilon=0.724543 Action_times=3260612 Epoche=7759\n",
      "Epsilon=0.724509 Action_times=3261096 Epoche=7760\n",
      "Epsilon=0.724472 Action_times=3261608 Epoche=7761\n",
      "Epsilon=0.724366 Action_times=3263102 Epoche=7762\n",
      "Epsilon=0.724256 Action_times=3264630 Epoche=7763\n",
      "Epsilon=0.724135 Action_times=3266326 Epoche=7764\n",
      "Epsilon=0.724113 Action_times=3266634 Epoche=7765\n",
      "Epsilon=0.723970 Action_times=3268645 Epoche=7766\n",
      "Epsilon=0.723946 Action_times=3268983 Epoche=7767\n",
      "Epsilon=0.723838 Action_times=3270492 Epoche=7768\n",
      "Epsilon=0.723781 Action_times=3271291 Epoche=7769\n",
      "Epsilon=0.723748 Action_times=3271751 Epoche=7770\n",
      "Epsilon=0.723647 Action_times=3273171 Epoche=7771\n",
      "Epsilon=0.723599 Action_times=3273840 Epoche=7772\n",
      "Epsilon=0.723555 Action_times=3274451 Epoche=7773\n",
      "Epsilon=0.723506 Action_times=3275145 Epoche=7774\n",
      "Epsilon=0.723418 Action_times=3276375 Epoche=7775\n",
      "Epsilon=0.723371 Action_times=3277027 Epoche=7776\n",
      "Epsilon=0.723341 Action_times=3277448 Epoche=7777\n",
      "Epsilon=0.723263 Action_times=3278547 Epoche=7778\n",
      "Epsilon=0.723203 Action_times=3279390 Epoche=7779\n",
      "Epsilon=0.723140 Action_times=3280277 Epoche=7780\n",
      "Epsilon=0.722950 Action_times=3282936 Epoche=7781\n",
      "Epsilon=0.722837 Action_times=3284523 Epoche=7782\n",
      "Epsilon=0.722729 Action_times=3286038 Epoche=7783\n",
      "Epsilon=0.722552 Action_times=3288516 Epoche=7784\n",
      "Epsilon=0.722489 Action_times=3289408 Epoche=7785\n",
      "Epsilon=0.722449 Action_times=3289962 Epoche=7786\n",
      "Epsilon=0.722401 Action_times=3290637 Epoche=7787\n",
      "Epsilon=0.722336 Action_times=3291548 Epoche=7788\n",
      "Epsilon=0.722253 Action_times=3292714 Epoche=7789\n",
      "Epsilon=0.722172 Action_times=3293853 Epoche=7790\n",
      "Epsilon=0.722132 Action_times=3294418 Epoche=7791\n",
      "Epsilon=0.722092 Action_times=3294972 Epoche=7792\n",
      "Epsilon=0.722048 Action_times=3295593 Epoche=7793\n",
      "Epsilon=0.722016 Action_times=3296051 Epoche=7794\n",
      "Epsilon=0.721912 Action_times=3297511 Epoche=7795\n",
      "Epsilon=0.721898 Action_times=3297697 Epoche=7796\n",
      "Epsilon=0.721817 Action_times=3298835 Epoche=7797\n",
      "Epsilon=0.721711 Action_times=3300326 Epoche=7798\n",
      "Epsilon=0.721658 Action_times=3301073 Epoche=7799\n",
      "Epsilon=0.721600 Action_times=3301888 Epoche=7800\n",
      "Epsilon=0.721479 Action_times=3303587 Epoche=7801\n",
      "Epsilon=0.721468 Action_times=3303751 Epoche=7802\n",
      "Epsilon=0.721400 Action_times=3304703 Epoche=7803\n",
      "Epsilon=0.721304 Action_times=3306052 Epoche=7804\n",
      "Epsilon=0.721214 Action_times=3307314 Epoche=7805\n",
      "Epsilon=0.721077 Action_times=3309237 Epoche=7806\n",
      "Epsilon=0.721021 Action_times=3310032 Epoche=7807\n",
      "Epsilon=0.720961 Action_times=3310879 Epoche=7808\n",
      "Epsilon=0.720921 Action_times=3311439 Epoche=7809\n",
      "Epsilon=0.720712 Action_times=3314375 Epoche=7810\n",
      "Epsilon=0.720633 Action_times=3315482 Epoche=7811\n",
      "Epsilon=0.720516 Action_times=3317133 Epoche=7812\n",
      "Epsilon=0.720504 Action_times=3317297 Epoche=7813\n",
      "Epsilon=0.720447 Action_times=3318111 Epoche=7814\n",
      "Epsilon=0.720334 Action_times=3319696 Epoche=7815\n",
      "Epsilon=0.720256 Action_times=3320801 Epoche=7816\n",
      "Epsilon=0.720202 Action_times=3321558 Epoche=7817\n",
      "Epsilon=0.720096 Action_times=3323048 Epoche=7818\n",
      "Epsilon=0.719982 Action_times=3324655 Epoche=7819\n",
      "Epsilon=0.719893 Action_times=3325906 Epoche=7820\n",
      "Epsilon=0.719849 Action_times=3326520 Epoche=7821\n",
      "Epsilon=0.719840 Action_times=3326649 Epoche=7822\n",
      "Epsilon=0.719819 Action_times=3326950 Epoche=7823\n",
      "Epsilon=0.719709 Action_times=3328495 Epoche=7824\n",
      "Epsilon=0.719678 Action_times=3328935 Epoche=7825\n",
      "Epsilon=0.719577 Action_times=3330361 Epoche=7826\n",
      "Epsilon=0.719520 Action_times=3331167 Epoche=7827\n",
      "Epsilon=0.719481 Action_times=3331712 Epoche=7828\n",
      "Epsilon=0.719452 Action_times=3332115 Epoche=7829\n",
      "Epsilon=0.719416 Action_times=3332627 Epoche=7830\n",
      "Epsilon=0.719374 Action_times=3333218 Epoche=7831\n",
      "Epsilon=0.719303 Action_times=3334218 Epoche=7832\n",
      "Epsilon=0.719279 Action_times=3334560 Epoche=7833\n",
      "Epsilon=0.719202 Action_times=3335641 Epoche=7834\n",
      "Epsilon=0.719160 Action_times=3336234 Epoche=7835\n",
      "Epsilon=0.719105 Action_times=3337014 Epoche=7836\n",
      "Epsilon=0.719068 Action_times=3337534 Epoche=7837\n",
      "Epsilon=0.719026 Action_times=3338124 Epoche=7838\n",
      "Epsilon=0.718988 Action_times=3338663 Epoche=7839\n",
      "Epsilon=0.718870 Action_times=3340321 Epoche=7840\n",
      "Epsilon=0.718794 Action_times=3341404 Epoche=7841\n",
      "Epsilon=0.718716 Action_times=3342497 Epoche=7842\n",
      "Epsilon=0.718677 Action_times=3343054 Epoche=7843\n",
      "Epsilon=0.718603 Action_times=3344097 Epoche=7844\n",
      "Epsilon=0.718488 Action_times=3345714 Epoche=7845\n",
      "Epsilon=0.718395 Action_times=3347038 Epoche=7846\n",
      "Epsilon=0.718356 Action_times=3347582 Epoche=7847\n",
      "Epsilon=0.718275 Action_times=3348724 Epoche=7848\n",
      "Epsilon=0.718147 Action_times=3350534 Epoche=7849\n",
      "Epsilon=0.718109 Action_times=3351067 Epoche=7850\n",
      "Epsilon=0.718039 Action_times=3352058 Epoche=7851\n",
      "Epsilon=0.718022 Action_times=3352293 Epoche=7852\n",
      "Epsilon=0.717911 Action_times=3353859 Epoche=7853\n",
      "Epsilon=0.717714 Action_times=3356652 Epoche=7854\n",
      "Epsilon=0.717592 Action_times=3358368 Epoche=7855\n",
      "Epsilon=0.717496 Action_times=3359731 Epoche=7856\n",
      "Epsilon=0.717421 Action_times=3360785 Epoche=7857\n",
      "Epsilon=0.717387 Action_times=3361276 Epoche=7858\n",
      "Epsilon=0.717291 Action_times=3362628 Epoche=7859\n",
      "Epsilon=0.717266 Action_times=3362981 Epoche=7860\n",
      "Epsilon=0.717202 Action_times=3363890 Epoche=7861\n",
      "Epsilon=0.717172 Action_times=3364308 Epoche=7862\n",
      "Epsilon=0.717115 Action_times=3365121 Epoche=7863\n",
      "Epsilon=0.717113 Action_times=3365151 Epoche=7864\n",
      "Epsilon=0.717078 Action_times=3365641 Epoche=7865\n",
      "Epsilon=0.716982 Action_times=3366991 Epoche=7866\n",
      "Epsilon=0.716924 Action_times=3367820 Epoche=7867\n",
      "Epsilon=0.716915 Action_times=3367939 Epoche=7868\n",
      "Epsilon=0.716865 Action_times=3368646 Epoche=7869\n",
      "Epsilon=0.716793 Action_times=3369673 Epoche=7870\n",
      "Epsilon=0.716751 Action_times=3370263 Epoche=7871\n",
      "Epsilon=0.716722 Action_times=3370678 Epoche=7872\n",
      "Epsilon=0.716597 Action_times=3372438 Epoche=7873\n",
      "Epsilon=0.716545 Action_times=3373180 Epoche=7874\n",
      "Epsilon=0.716389 Action_times=3375391 Epoche=7875\n",
      "Epsilon=0.716331 Action_times=3376212 Epoche=7876\n",
      "Epsilon=0.716214 Action_times=3377873 Epoche=7877\n",
      "Epsilon=0.716097 Action_times=3379517 Epoche=7878\n",
      "Epsilon=0.716088 Action_times=3379656 Epoche=7879\n",
      "Epsilon=0.716040 Action_times=3380331 Epoche=7880\n",
      "Epsilon=0.715909 Action_times=3382190 Epoche=7881\n",
      "Epsilon=0.715866 Action_times=3382795 Epoche=7882\n",
      "Epsilon=0.715788 Action_times=3383896 Epoche=7883\n",
      "Epsilon=0.715706 Action_times=3385063 Epoche=7884\n",
      "Epsilon=0.715659 Action_times=3385724 Epoche=7885\n",
      "Epsilon=0.715550 Action_times=3387266 Epoche=7886\n",
      "Epsilon=0.715465 Action_times=3388478 Epoche=7887\n",
      "Epsilon=0.715339 Action_times=3390269 Epoche=7888\n",
      "Epsilon=0.715291 Action_times=3390949 Epoche=7889\n",
      "Epsilon=0.715218 Action_times=3391982 Epoche=7890\n",
      "Epsilon=0.715140 Action_times=3393079 Epoche=7891\n",
      "Epsilon=0.715077 Action_times=3393980 Epoche=7892\n",
      "Epsilon=0.714929 Action_times=3396078 Epoche=7893\n",
      "Epsilon=0.714802 Action_times=3397883 Epoche=7894\n",
      "Epsilon=0.714689 Action_times=3399478 Epoche=7895\n",
      "Epsilon=0.714627 Action_times=3400357 Epoche=7896\n",
      "Epsilon=0.714578 Action_times=3401059 Epoche=7897\n",
      "Epsilon=0.714499 Action_times=3402175 Epoche=7898\n",
      "Epsilon=0.714451 Action_times=3402864 Epoche=7899\n",
      "Epsilon=0.714390 Action_times=3403723 Epoche=7900\n",
      "Epsilon=0.714353 Action_times=3404248 Epoche=7901\n",
      "Epsilon=0.714215 Action_times=3406215 Epoche=7902\n",
      "Epsilon=0.714146 Action_times=3407193 Epoche=7903\n",
      "Epsilon=0.714133 Action_times=3407378 Epoche=7904\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.714104 Action_times=3407783 Epoche=7905\n",
      "Epsilon=0.713995 Action_times=3409331 Epoche=7906\n",
      "Epsilon=0.713941 Action_times=3410099 Epoche=7907\n",
      "Epsilon=0.713894 Action_times=3410766 Epoche=7908\n",
      "Epsilon=0.713827 Action_times=3411723 Epoche=7909\n",
      "Epsilon=0.713807 Action_times=3412012 Epoche=7910\n",
      "Epsilon=0.713658 Action_times=3414129 Epoche=7911\n",
      "Epsilon=0.713544 Action_times=3415746 Epoche=7912\n",
      "Epsilon=0.713443 Action_times=3417188 Epoche=7913\n",
      "Epsilon=0.713384 Action_times=3418013 Epoche=7914\n",
      "Epsilon=0.713374 Action_times=3418167 Epoche=7915\n",
      "Epsilon=0.713366 Action_times=3418282 Epoche=7916\n",
      "Epsilon=0.713333 Action_times=3418739 Epoche=7917\n",
      "Epsilon=0.713304 Action_times=3419163 Epoche=7918\n",
      "Epsilon=0.713229 Action_times=3420229 Epoche=7919\n",
      "Epsilon=0.713193 Action_times=3420730 Epoche=7920\n",
      "Epsilon=0.713004 Action_times=3423418 Epoche=7921\n",
      "Epsilon=0.712939 Action_times=3424343 Epoche=7922\n",
      "Epsilon=0.712920 Action_times=3424618 Epoche=7923\n",
      "Epsilon=0.712848 Action_times=3425650 Epoche=7924\n",
      "Epsilon=0.712582 Action_times=3429429 Epoche=7925\n",
      "Epsilon=0.712504 Action_times=3430541 Epoche=7926\n",
      "Epsilon=0.712333 Action_times=3432970 Epoche=7927\n",
      "Epsilon=0.712165 Action_times=3435363 Epoche=7928\n",
      "Epsilon=0.712049 Action_times=3437017 Epoche=7929\n",
      "Epsilon=0.711970 Action_times=3438144 Epoche=7930\n",
      "Epsilon=0.711869 Action_times=3439580 Epoche=7931\n",
      "Epsilon=0.711644 Action_times=3442786 Epoche=7932\n",
      "Epsilon=0.711440 Action_times=3445695 Epoche=7933\n",
      "Epsilon=0.711413 Action_times=3446081 Epoche=7934\n",
      "Epsilon=0.711320 Action_times=3447408 Epoche=7935\n",
      "Epsilon=0.711281 Action_times=3447962 Epoche=7936\n",
      "Epsilon=0.711241 Action_times=3448531 Epoche=7937\n",
      "Epsilon=0.711193 Action_times=3449211 Epoche=7938\n",
      "Epsilon=0.711128 Action_times=3450143 Epoche=7939\n",
      "Epsilon=0.710986 Action_times=3452175 Epoche=7940\n",
      "Epsilon=0.710900 Action_times=3453399 Epoche=7941\n",
      "Epsilon=0.710875 Action_times=3453758 Epoche=7942\n",
      "Epsilon=0.710748 Action_times=3455573 Epoche=7943\n",
      "Epsilon=0.710639 Action_times=3457126 Epoche=7944\n",
      "Epsilon=0.710507 Action_times=3459006 Epoche=7945\n",
      "Epsilon=0.710366 Action_times=3461026 Epoche=7946\n",
      "Epsilon=0.710302 Action_times=3461932 Epoche=7947\n",
      "Epsilon=0.710267 Action_times=3462436 Epoche=7948\n",
      "Epsilon=0.710246 Action_times=3462733 Epoche=7949\n",
      "Epsilon=0.710135 Action_times=3464313 Epoche=7950\n",
      "Epsilon=0.710091 Action_times=3464953 Epoche=7951\n",
      "Epsilon=0.710044 Action_times=3465616 Epoche=7952\n",
      "Epsilon=0.709991 Action_times=3466376 Epoche=7953\n",
      "Epsilon=0.709920 Action_times=3467395 Epoche=7954\n",
      "Epsilon=0.709847 Action_times=3468428 Epoche=7955\n",
      "Epsilon=0.709783 Action_times=3469349 Epoche=7956\n",
      "Epsilon=0.709763 Action_times=3469638 Epoche=7957\n",
      "Epsilon=0.709689 Action_times=3470690 Epoche=7958\n",
      "Epsilon=0.709653 Action_times=3471198 Epoche=7959\n",
      "Epsilon=0.709594 Action_times=3472050 Epoche=7960\n",
      "Epsilon=0.709515 Action_times=3473172 Epoche=7961\n",
      "Epsilon=0.709344 Action_times=3475624 Epoche=7962\n",
      "Epsilon=0.709278 Action_times=3476559 Epoche=7963\n",
      "Epsilon=0.709206 Action_times=3477594 Epoche=7964\n",
      "Epsilon=0.709148 Action_times=3478428 Epoche=7965\n",
      "Epsilon=0.709064 Action_times=3479631 Epoche=7966\n",
      "Epsilon=0.709053 Action_times=3479783 Epoche=7967\n",
      "Epsilon=0.709016 Action_times=3480317 Epoche=7968\n",
      "Epsilon=0.708998 Action_times=3480574 Epoche=7969\n",
      "Epsilon=0.708952 Action_times=3481234 Epoche=7970\n",
      "Epsilon=0.708880 Action_times=3482253 Epoche=7971\n",
      "Epsilon=0.708800 Action_times=3483398 Epoche=7972\n",
      "Epsilon=0.708753 Action_times=3484074 Epoche=7973\n",
      "Epsilon=0.708631 Action_times=3485829 Epoche=7974\n",
      "Epsilon=0.708629 Action_times=3485856 Epoche=7975\n",
      "Epsilon=0.708602 Action_times=3486231 Epoche=7976\n",
      "Epsilon=0.708463 Action_times=3488222 Epoche=7977\n",
      "Epsilon=0.708406 Action_times=3489039 Epoche=7978\n",
      "Epsilon=0.708226 Action_times=3491622 Epoche=7979\n",
      "Epsilon=0.708083 Action_times=3493673 Epoche=7980\n",
      "Epsilon=0.708037 Action_times=3494324 Epoche=7981\n",
      "Epsilon=0.707941 Action_times=3495708 Epoche=7982\n",
      "Epsilon=0.707893 Action_times=3496393 Epoche=7983\n",
      "Epsilon=0.707808 Action_times=3497610 Epoche=7984\n",
      "Epsilon=0.707778 Action_times=3498046 Epoche=7985\n",
      "Epsilon=0.707747 Action_times=3498485 Epoche=7986\n",
      "Epsilon=0.707657 Action_times=3499780 Epoche=7987\n",
      "Epsilon=0.707620 Action_times=3500299 Epoche=7988\n",
      "Epsilon=0.707582 Action_times=3500844 Epoche=7989\n",
      "Epsilon=0.707466 Action_times=3502518 Epoche=7990\n",
      "Epsilon=0.707453 Action_times=3502703 Epoche=7991\n",
      "Epsilon=0.707341 Action_times=3504307 Epoche=7992\n",
      "Epsilon=0.707307 Action_times=3504786 Epoche=7993\n",
      "Epsilon=0.707275 Action_times=3505249 Epoche=7994\n",
      "Epsilon=0.707216 Action_times=3506100 Epoche=7995\n",
      "Epsilon=0.707150 Action_times=3507038 Epoche=7996\n",
      "Epsilon=0.707122 Action_times=3507439 Epoche=7997\n",
      "Epsilon=0.707055 Action_times=3508408 Epoche=7998\n",
      "Epsilon=0.707036 Action_times=3508686 Epoche=7999\n",
      "Epsilon=0.706963 Action_times=3509723 Epoche=8000\n",
      "Epsilon=0.706806 Action_times=3511986 Epoche=8001\n",
      "Epsilon=0.706726 Action_times=3513131 Epoche=8002\n",
      "Epsilon=0.706710 Action_times=3513350 Epoche=8003\n",
      "Epsilon=0.706661 Action_times=3514062 Epoche=8004\n",
      "Epsilon=0.706601 Action_times=3514918 Epoche=8005\n",
      "Epsilon=0.706483 Action_times=3516617 Epoche=8006\n",
      "Epsilon=0.706475 Action_times=3516724 Epoche=8007\n",
      "Epsilon=0.706374 Action_times=3518177 Epoche=8008\n",
      "Epsilon=0.706307 Action_times=3519150 Epoche=8009\n",
      "Epsilon=0.706258 Action_times=3519844 Epoche=8010\n",
      "Epsilon=0.706199 Action_times=3520691 Epoche=8011\n",
      "Epsilon=0.706055 Action_times=3522758 Epoche=8012\n",
      "Epsilon=0.706033 Action_times=3523076 Epoche=8013\n",
      "Epsilon=0.705928 Action_times=3524585 Epoche=8014\n",
      "Epsilon=0.705819 Action_times=3526151 Epoche=8015\n",
      "Epsilon=0.705779 Action_times=3526728 Epoche=8016\n",
      "Epsilon=0.705740 Action_times=3527287 Epoche=8017\n",
      "Epsilon=0.705667 Action_times=3528338 Epoche=8018\n",
      "Epsilon=0.705650 Action_times=3528586 Epoche=8019\n",
      "Epsilon=0.705578 Action_times=3529620 Epoche=8020\n",
      "Epsilon=0.705407 Action_times=3532070 Epoche=8021\n",
      "Epsilon=0.705361 Action_times=3532742 Epoche=8022\n",
      "Epsilon=0.705288 Action_times=3533794 Epoche=8023\n",
      "Epsilon=0.705238 Action_times=3534511 Epoche=8024\n",
      "Epsilon=0.705129 Action_times=3536077 Epoche=8025\n",
      "Epsilon=0.705082 Action_times=3536749 Epoche=8026\n",
      "Epsilon=0.704971 Action_times=3538350 Epoche=8027\n",
      "Epsilon=0.704909 Action_times=3539241 Epoche=8028\n",
      "Epsilon=0.704898 Action_times=3539396 Epoche=8029\n",
      "Epsilon=0.704842 Action_times=3540210 Epoche=8030\n",
      "Epsilon=0.704794 Action_times=3540889 Epoche=8031\n",
      "Epsilon=0.704753 Action_times=3541486 Epoche=8032\n",
      "Epsilon=0.704698 Action_times=3542274 Epoche=8033\n",
      "Epsilon=0.704584 Action_times=3543915 Epoche=8034\n",
      "Epsilon=0.704566 Action_times=3544183 Epoche=8035\n",
      "Epsilon=0.704500 Action_times=3545127 Epoche=8036\n",
      "Epsilon=0.704402 Action_times=3546541 Epoche=8037\n",
      "Epsilon=0.704311 Action_times=3547854 Epoche=8038\n",
      "Epsilon=0.704212 Action_times=3549271 Epoche=8039\n",
      "Epsilon=0.704189 Action_times=3549603 Epoche=8040\n",
      "Epsilon=0.704161 Action_times=3550005 Epoche=8041\n",
      "Epsilon=0.704124 Action_times=3550546 Epoche=8042\n",
      "Epsilon=0.704008 Action_times=3552211 Epoche=8043\n",
      "Epsilon=0.703968 Action_times=3552787 Epoche=8044\n",
      "Epsilon=0.703922 Action_times=3553450 Epoche=8045\n",
      "Epsilon=0.703870 Action_times=3554204 Epoche=8046\n",
      "Epsilon=0.703690 Action_times=3556794 Epoche=8047\n",
      "Epsilon=0.703600 Action_times=3558099 Epoche=8048\n",
      "Epsilon=0.703527 Action_times=3559152 Epoche=8049\n",
      "Epsilon=0.703504 Action_times=3559473 Epoche=8050\n",
      "Epsilon=0.703429 Action_times=3560556 Epoche=8051\n",
      "Epsilon=0.703337 Action_times=3561886 Epoche=8052\n",
      "Epsilon=0.703211 Action_times=3563704 Epoche=8053\n",
      "Epsilon=0.703101 Action_times=3565295 Epoche=8054\n",
      "Epsilon=0.702985 Action_times=3566973 Epoche=8055\n",
      "Epsilon=0.702906 Action_times=3568113 Epoche=8056\n",
      "Epsilon=0.702842 Action_times=3569031 Epoche=8057\n",
      "Epsilon=0.702621 Action_times=3572223 Epoche=8058\n",
      "Epsilon=0.702528 Action_times=3573563 Epoche=8059\n",
      "Epsilon=0.702433 Action_times=3574940 Epoche=8060\n",
      "Epsilon=0.702338 Action_times=3576308 Epoche=8061\n",
      "Epsilon=0.702284 Action_times=3577088 Epoche=8062\n",
      "Epsilon=0.702233 Action_times=3577822 Epoche=8063\n",
      "Epsilon=0.702198 Action_times=3578327 Epoche=8064\n",
      "Epsilon=0.702148 Action_times=3579053 Epoche=8065\n",
      "Epsilon=0.702072 Action_times=3580146 Epoche=8066\n",
      "Epsilon=0.701996 Action_times=3581246 Epoche=8067\n",
      "Epsilon=0.701934 Action_times=3582139 Epoche=8068\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.701820 Action_times=3583789 Epoche=8069\n",
      "Epsilon=0.701732 Action_times=3585057 Epoche=8070\n",
      "Epsilon=0.701657 Action_times=3586142 Epoche=8071\n",
      "Epsilon=0.701621 Action_times=3586666 Epoche=8072\n",
      "Epsilon=0.701596 Action_times=3587034 Epoche=8073\n",
      "Epsilon=0.701524 Action_times=3588077 Epoche=8074\n",
      "Epsilon=0.701429 Action_times=3589443 Epoche=8075\n",
      "Epsilon=0.701399 Action_times=3589884 Epoche=8076\n",
      "Epsilon=0.701320 Action_times=3591020 Epoche=8077\n",
      "Epsilon=0.701173 Action_times=3593150 Epoche=8078\n",
      "Epsilon=0.701144 Action_times=3593566 Epoche=8079\n",
      "Epsilon=0.701030 Action_times=3595214 Epoche=8080\n",
      "Epsilon=0.700958 Action_times=3596259 Epoche=8081\n",
      "Epsilon=0.700796 Action_times=3598607 Epoche=8082\n",
      "Epsilon=0.700611 Action_times=3601289 Epoche=8083\n",
      "Epsilon=0.700583 Action_times=3601683 Epoche=8084\n",
      "Epsilon=0.700559 Action_times=3602033 Epoche=8085\n",
      "Epsilon=0.700478 Action_times=3603206 Epoche=8086\n",
      "Epsilon=0.700458 Action_times=3603501 Epoche=8087\n",
      "Epsilon=0.700372 Action_times=3604747 Epoche=8088\n",
      "Epsilon=0.700320 Action_times=3605492 Epoche=8089\n",
      "Epsilon=0.700198 Action_times=3607268 Epoche=8090\n",
      "Epsilon=0.700093 Action_times=3608784 Epoche=8091\n",
      "Epsilon=0.700066 Action_times=3609176 Epoche=8092\n",
      "Epsilon=0.700065 Action_times=3609194 Epoche=8093\n",
      "Epsilon=0.700053 Action_times=3609370 Epoche=8094\n",
      "Epsilon=0.700040 Action_times=3609552 Epoche=8095\n",
      "Epsilon=0.700013 Action_times=3609939 Epoche=8096\n",
      "Epsilon=0.699884 Action_times=3611818 Epoche=8097\n",
      "Epsilon=0.699789 Action_times=3613195 Epoche=8098\n",
      "Epsilon=0.699746 Action_times=3613820 Epoche=8099\n",
      "Epsilon=0.699669 Action_times=3614930 Epoche=8100\n",
      "Epsilon=0.699599 Action_times=3615944 Epoche=8101\n",
      "Epsilon=0.699579 Action_times=3616242 Epoche=8102\n",
      "Epsilon=0.699519 Action_times=3617114 Epoche=8103\n",
      "Epsilon=0.699451 Action_times=3618098 Epoche=8104\n",
      "Epsilon=0.699391 Action_times=3618964 Epoche=8105\n",
      "Epsilon=0.699316 Action_times=3620048 Epoche=8106\n",
      "Epsilon=0.699292 Action_times=3620403 Epoche=8107\n",
      "Epsilon=0.699255 Action_times=3620940 Epoche=8108\n",
      "Epsilon=0.699223 Action_times=3621394 Epoche=8109\n",
      "Epsilon=0.699186 Action_times=3621939 Epoche=8110\n",
      "Epsilon=0.699135 Action_times=3622674 Epoche=8111\n",
      "Epsilon=0.699039 Action_times=3624072 Epoche=8112\n",
      "Epsilon=0.698996 Action_times=3624688 Epoche=8113\n",
      "Epsilon=0.698971 Action_times=3625062 Epoche=8114\n",
      "Epsilon=0.698937 Action_times=3625553 Epoche=8115\n",
      "Epsilon=0.698851 Action_times=3626802 Epoche=8116\n",
      "Epsilon=0.698693 Action_times=3629092 Epoche=8117\n",
      "Epsilon=0.698617 Action_times=3630202 Epoche=8118\n",
      "Epsilon=0.698527 Action_times=3631509 Epoche=8119\n",
      "Epsilon=0.698486 Action_times=3632102 Epoche=8120\n",
      "Epsilon=0.698367 Action_times=3633827 Epoche=8121\n",
      "Epsilon=0.698293 Action_times=3634909 Epoche=8122\n",
      "Epsilon=0.698218 Action_times=3635995 Epoche=8123\n",
      "Epsilon=0.698154 Action_times=3636916 Epoche=8124\n",
      "Epsilon=0.698110 Action_times=3637567 Epoche=8125\n",
      "Epsilon=0.698087 Action_times=3637896 Epoche=8126\n",
      "Epsilon=0.698041 Action_times=3638564 Epoche=8127\n",
      "Epsilon=0.697979 Action_times=3639471 Epoche=8128\n",
      "Epsilon=0.697973 Action_times=3639559 Epoche=8129\n",
      "Epsilon=0.697932 Action_times=3640151 Epoche=8130\n",
      "Epsilon=0.697853 Action_times=3641302 Epoche=8131\n",
      "Epsilon=0.697803 Action_times=3642019 Epoche=8132\n",
      "Epsilon=0.697713 Action_times=3643330 Epoche=8133\n",
      "Epsilon=0.697593 Action_times=3645077 Epoche=8134\n",
      "Epsilon=0.697525 Action_times=3646069 Epoche=8135\n",
      "Epsilon=0.697504 Action_times=3646378 Epoche=8136\n",
      "Epsilon=0.697417 Action_times=3647632 Epoche=8137\n",
      "Epsilon=0.697302 Action_times=3649317 Epoche=8138\n",
      "Epsilon=0.697186 Action_times=3650996 Epoche=8139\n",
      "Epsilon=0.697063 Action_times=3652788 Epoche=8140\n",
      "Epsilon=0.697010 Action_times=3653559 Epoche=8141\n",
      "Epsilon=0.696918 Action_times=3654897 Epoche=8142\n",
      "Epsilon=0.696841 Action_times=3656022 Epoche=8143\n",
      "Epsilon=0.696711 Action_times=3657918 Epoche=8144\n",
      "Epsilon=0.696596 Action_times=3659592 Epoche=8145\n",
      "Epsilon=0.696503 Action_times=3660938 Epoche=8146\n",
      "Epsilon=0.696502 Action_times=3660951 Epoche=8147\n",
      "Epsilon=0.696440 Action_times=3661865 Epoche=8148\n",
      "Epsilon=0.696396 Action_times=3662495 Epoche=8149\n",
      "Epsilon=0.696368 Action_times=3662903 Epoche=8150\n",
      "Epsilon=0.696330 Action_times=3663471 Epoche=8151\n",
      "Epsilon=0.696266 Action_times=3664392 Epoche=8152\n",
      "Epsilon=0.696209 Action_times=3665221 Epoche=8153\n",
      "Epsilon=0.696177 Action_times=3665699 Epoche=8154\n",
      "Epsilon=0.696117 Action_times=3666571 Epoche=8155\n",
      "Epsilon=0.696091 Action_times=3666945 Epoche=8156\n",
      "Epsilon=0.695973 Action_times=3668674 Epoche=8157\n",
      "Epsilon=0.695839 Action_times=3670621 Epoche=8158\n",
      "Epsilon=0.695733 Action_times=3672162 Epoche=8159\n",
      "Epsilon=0.695704 Action_times=3672582 Epoche=8160\n",
      "Epsilon=0.695700 Action_times=3672643 Epoche=8161\n",
      "Epsilon=0.695658 Action_times=3673260 Epoche=8162\n",
      "Epsilon=0.695575 Action_times=3674466 Epoche=8163\n",
      "Epsilon=0.695437 Action_times=3676480 Epoche=8164\n",
      "Epsilon=0.695361 Action_times=3677599 Epoche=8165\n",
      "Epsilon=0.695214 Action_times=3679742 Epoche=8166\n",
      "Epsilon=0.695060 Action_times=3681992 Epoche=8167\n",
      "Epsilon=0.694954 Action_times=3683538 Epoche=8168\n",
      "Epsilon=0.694912 Action_times=3684140 Epoche=8169\n",
      "Epsilon=0.694898 Action_times=3684349 Epoche=8170\n",
      "Epsilon=0.694874 Action_times=3684704 Epoche=8171\n",
      "Epsilon=0.694813 Action_times=3685588 Epoche=8172\n",
      "Epsilon=0.694756 Action_times=3686423 Epoche=8173\n",
      "Epsilon=0.694640 Action_times=3688117 Epoche=8174\n",
      "Epsilon=0.694573 Action_times=3689095 Epoche=8175\n",
      "Epsilon=0.694441 Action_times=3691027 Epoche=8176\n",
      "Epsilon=0.694310 Action_times=3692938 Epoche=8177\n",
      "Epsilon=0.694199 Action_times=3694555 Epoche=8178\n",
      "Epsilon=0.694129 Action_times=3695587 Epoche=8179\n",
      "Epsilon=0.693971 Action_times=3697894 Epoche=8180\n",
      "Epsilon=0.693889 Action_times=3699091 Epoche=8181\n",
      "Epsilon=0.693824 Action_times=3700038 Epoche=8182\n",
      "Epsilon=0.693812 Action_times=3700219 Epoche=8183\n",
      "Epsilon=0.693752 Action_times=3701103 Epoche=8184\n",
      "Epsilon=0.693675 Action_times=3702227 Epoche=8185\n",
      "Epsilon=0.693617 Action_times=3703069 Epoche=8186\n",
      "Epsilon=0.693551 Action_times=3704034 Epoche=8187\n",
      "Epsilon=0.693491 Action_times=3704921 Epoche=8188\n",
      "Epsilon=0.693429 Action_times=3705824 Epoche=8189\n",
      "Epsilon=0.693404 Action_times=3706183 Epoche=8190\n",
      "Epsilon=0.693204 Action_times=3709111 Epoche=8191\n",
      "Epsilon=0.693150 Action_times=3709899 Epoche=8192\n",
      "Epsilon=0.693121 Action_times=3710328 Epoche=8193\n",
      "Epsilon=0.693070 Action_times=3711080 Epoche=8194\n",
      "Epsilon=0.693042 Action_times=3711490 Epoche=8195\n",
      "Epsilon=0.693023 Action_times=3711769 Epoche=8196\n",
      "Epsilon=0.692951 Action_times=3712820 Epoche=8197\n",
      "Epsilon=0.692908 Action_times=3713448 Epoche=8198\n",
      "Epsilon=0.692838 Action_times=3714477 Epoche=8199\n",
      "Epsilon=0.692787 Action_times=3715214 Epoche=8200\n",
      "Epsilon=0.692737 Action_times=3715952 Epoche=8201\n",
      "Epsilon=0.692642 Action_times=3717341 Epoche=8202\n",
      "Epsilon=0.692521 Action_times=3719121 Epoche=8203\n",
      "Epsilon=0.692432 Action_times=3720420 Epoche=8204\n",
      "Epsilon=0.692360 Action_times=3721482 Epoche=8205\n",
      "Epsilon=0.692284 Action_times=3722591 Epoche=8206\n",
      "Epsilon=0.692169 Action_times=3724280 Epoche=8207\n",
      "Epsilon=0.692096 Action_times=3725348 Epoche=8208\n",
      "Epsilon=0.692035 Action_times=3726240 Epoche=8209\n",
      "Epsilon=0.691898 Action_times=3728253 Epoche=8210\n",
      "Epsilon=0.691765 Action_times=3730196 Epoche=8211\n",
      "Epsilon=0.691681 Action_times=3731426 Epoche=8212\n",
      "Epsilon=0.691649 Action_times=3731899 Epoche=8213\n",
      "Epsilon=0.691562 Action_times=3733173 Epoche=8214\n",
      "Epsilon=0.691498 Action_times=3734113 Epoche=8215\n",
      "Epsilon=0.691465 Action_times=3734602 Epoche=8216\n",
      "Epsilon=0.691401 Action_times=3735539 Epoche=8217\n",
      "Epsilon=0.691318 Action_times=3736753 Epoche=8218\n",
      "Epsilon=0.691275 Action_times=3737384 Epoche=8219\n",
      "Epsilon=0.691209 Action_times=3738353 Epoche=8220\n",
      "Epsilon=0.691104 Action_times=3739894 Epoche=8221\n",
      "Epsilon=0.691092 Action_times=3740071 Epoche=8222\n",
      "Epsilon=0.691036 Action_times=3740904 Epoche=8223\n",
      "Epsilon=0.691028 Action_times=3741017 Epoche=8224\n",
      "Epsilon=0.690978 Action_times=3741745 Epoche=8225\n",
      "Epsilon=0.690946 Action_times=3742214 Epoche=8226\n",
      "Epsilon=0.690904 Action_times=3742832 Epoche=8227\n",
      "Epsilon=0.690804 Action_times=3744299 Epoche=8228\n",
      "Epsilon=0.690745 Action_times=3745177 Epoche=8229\n",
      "Epsilon=0.690659 Action_times=3746434 Epoche=8230\n",
      "Epsilon=0.690601 Action_times=3747289 Epoche=8231\n",
      "Epsilon=0.690540 Action_times=3748178 Epoche=8232\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.690411 Action_times=3750080 Epoche=8233\n",
      "Epsilon=0.690303 Action_times=3751673 Epoche=8234\n",
      "Epsilon=0.690234 Action_times=3752678 Epoche=8235\n",
      "Epsilon=0.690114 Action_times=3754446 Epoche=8236\n",
      "Epsilon=0.689880 Action_times=3757889 Epoche=8237\n",
      "Epsilon=0.689796 Action_times=3759127 Epoche=8238\n",
      "Epsilon=0.689782 Action_times=3759322 Epoche=8239\n",
      "Epsilon=0.689717 Action_times=3760287 Epoche=8240\n",
      "Epsilon=0.689672 Action_times=3760952 Epoche=8241\n",
      "Epsilon=0.689566 Action_times=3762501 Epoche=8242\n",
      "Epsilon=0.689432 Action_times=3764483 Epoche=8243\n",
      "Epsilon=0.689415 Action_times=3764725 Epoche=8244\n",
      "Epsilon=0.689350 Action_times=3765690 Epoche=8245\n",
      "Epsilon=0.689279 Action_times=3766727 Epoche=8246\n",
      "Epsilon=0.689211 Action_times=3767735 Epoche=8247\n",
      "Epsilon=0.689128 Action_times=3768956 Epoche=8248\n",
      "Epsilon=0.689046 Action_times=3770168 Epoche=8249\n",
      "Epsilon=0.688932 Action_times=3771843 Epoche=8250\n",
      "Epsilon=0.688889 Action_times=3772466 Epoche=8251\n",
      "Epsilon=0.688853 Action_times=3773009 Epoche=8252\n",
      "Epsilon=0.688813 Action_times=3773587 Epoche=8253\n",
      "Epsilon=0.688759 Action_times=3774387 Epoche=8254\n",
      "Epsilon=0.688719 Action_times=3774979 Epoche=8255\n",
      "Epsilon=0.688662 Action_times=3775819 Epoche=8256\n",
      "Epsilon=0.688643 Action_times=3776091 Epoche=8257\n",
      "Epsilon=0.688554 Action_times=3777405 Epoche=8258\n",
      "Epsilon=0.688528 Action_times=3777793 Epoche=8259\n",
      "Epsilon=0.688496 Action_times=3778257 Epoche=8260\n",
      "Epsilon=0.688377 Action_times=3780011 Epoche=8261\n",
      "Epsilon=0.688260 Action_times=3781744 Epoche=8262\n",
      "Epsilon=0.688242 Action_times=3782005 Epoche=8263\n",
      "Epsilon=0.688233 Action_times=3782142 Epoche=8264\n",
      "Epsilon=0.688129 Action_times=3783671 Epoche=8265\n",
      "Epsilon=0.688010 Action_times=3785423 Epoche=8266\n",
      "Epsilon=0.687949 Action_times=3786323 Epoche=8267\n",
      "Epsilon=0.687918 Action_times=3786788 Epoche=8268\n",
      "Epsilon=0.687712 Action_times=3789821 Epoche=8269\n",
      "Epsilon=0.687664 Action_times=3790535 Epoche=8270\n",
      "Epsilon=0.687625 Action_times=3791109 Epoche=8271\n",
      "Epsilon=0.687556 Action_times=3792134 Epoche=8272\n",
      "Epsilon=0.687504 Action_times=3792893 Epoche=8273\n",
      "Epsilon=0.687472 Action_times=3793363 Epoche=8274\n",
      "Epsilon=0.687416 Action_times=3794195 Epoche=8275\n",
      "Epsilon=0.687354 Action_times=3795116 Epoche=8276\n",
      "Epsilon=0.687318 Action_times=3795646 Epoche=8277\n",
      "Epsilon=0.687243 Action_times=3796741 Epoche=8278\n",
      "Epsilon=0.687179 Action_times=3797700 Epoche=8279\n",
      "Epsilon=0.687075 Action_times=3799225 Epoche=8280\n",
      "Epsilon=0.687055 Action_times=3799530 Epoche=8281\n",
      "Epsilon=0.686926 Action_times=3801435 Epoche=8282\n",
      "Epsilon=0.686874 Action_times=3802193 Epoche=8283\n",
      "Epsilon=0.686833 Action_times=3802798 Epoche=8284\n",
      "Epsilon=0.686792 Action_times=3803409 Epoche=8285\n",
      "Epsilon=0.686773 Action_times=3803695 Epoche=8286\n",
      "Epsilon=0.686747 Action_times=3804075 Epoche=8287\n",
      "Epsilon=0.686712 Action_times=3804599 Epoche=8288\n",
      "Epsilon=0.686679 Action_times=3805080 Epoche=8289\n",
      "Epsilon=0.686575 Action_times=3806613 Epoche=8290\n",
      "Epsilon=0.686543 Action_times=3807093 Epoche=8291\n",
      "Epsilon=0.686455 Action_times=3808393 Epoche=8292\n",
      "Epsilon=0.686387 Action_times=3809402 Epoche=8293\n",
      "Epsilon=0.686351 Action_times=3809930 Epoche=8294\n",
      "Epsilon=0.686227 Action_times=3811762 Epoche=8295\n",
      "Epsilon=0.686132 Action_times=3813164 Epoche=8296\n",
      "Epsilon=0.685977 Action_times=3815462 Epoche=8297\n",
      "Epsilon=0.685882 Action_times=3816864 Epoche=8298\n",
      "Epsilon=0.685842 Action_times=3817450 Epoche=8299\n",
      "Epsilon=0.685713 Action_times=3819372 Epoche=8300\n",
      "Epsilon=0.685672 Action_times=3819974 Epoche=8301\n",
      "Epsilon=0.685597 Action_times=3821083 Epoche=8302\n",
      "Epsilon=0.685531 Action_times=3822064 Epoche=8303\n",
      "Epsilon=0.685436 Action_times=3823472 Epoche=8304\n",
      "Epsilon=0.685342 Action_times=3824855 Epoche=8305\n",
      "Epsilon=0.685252 Action_times=3826185 Epoche=8306\n",
      "Epsilon=0.685207 Action_times=3826851 Epoche=8307\n",
      "Epsilon=0.685129 Action_times=3828009 Epoche=8308\n",
      "Epsilon=0.685108 Action_times=3828330 Epoche=8309\n",
      "Epsilon=0.684998 Action_times=3829946 Epoche=8310\n",
      "Epsilon=0.684970 Action_times=3830367 Epoche=8311\n",
      "Epsilon=0.684946 Action_times=3830720 Epoche=8312\n",
      "Epsilon=0.684854 Action_times=3832092 Epoche=8313\n",
      "Epsilon=0.684752 Action_times=3833600 Epoche=8314\n",
      "Epsilon=0.684723 Action_times=3834024 Epoche=8315\n",
      "Epsilon=0.684498 Action_times=3837362 Epoche=8316\n",
      "Epsilon=0.684429 Action_times=3838392 Epoche=8317\n",
      "Epsilon=0.684327 Action_times=3839893 Epoche=8318\n",
      "Epsilon=0.684254 Action_times=3840985 Epoche=8319\n",
      "Epsilon=0.684165 Action_times=3842295 Epoche=8320\n",
      "Epsilon=0.684164 Action_times=3842314 Epoche=8321\n",
      "Epsilon=0.684101 Action_times=3843249 Epoche=8322\n",
      "Epsilon=0.684093 Action_times=3843368 Epoche=8323\n",
      "Epsilon=0.684004 Action_times=3844688 Epoche=8324\n",
      "Epsilon=0.683864 Action_times=3846761 Epoche=8325\n",
      "Epsilon=0.683846 Action_times=3847027 Epoche=8326\n",
      "Epsilon=0.683790 Action_times=3847867 Epoche=8327\n",
      "Epsilon=0.683736 Action_times=3848666 Epoche=8328\n",
      "Epsilon=0.683681 Action_times=3849489 Epoche=8329\n",
      "Epsilon=0.683654 Action_times=3849881 Epoche=8330\n",
      "Epsilon=0.683607 Action_times=3850578 Epoche=8331\n",
      "Epsilon=0.683464 Action_times=3852704 Epoche=8332\n",
      "Epsilon=0.683367 Action_times=3854139 Epoche=8333\n",
      "Epsilon=0.683283 Action_times=3855387 Epoche=8334\n",
      "Epsilon=0.683213 Action_times=3856439 Epoche=8335\n",
      "Epsilon=0.683169 Action_times=3857091 Epoche=8336\n",
      "Epsilon=0.683078 Action_times=3858435 Epoche=8337\n",
      "Epsilon=0.682924 Action_times=3860725 Epoche=8338\n",
      "Epsilon=0.682802 Action_times=3862543 Epoche=8339\n",
      "Epsilon=0.682732 Action_times=3863586 Epoche=8340\n",
      "Epsilon=0.682694 Action_times=3864144 Epoche=8341\n",
      "Epsilon=0.682600 Action_times=3865545 Epoche=8342\n",
      "Epsilon=0.682527 Action_times=3866620 Epoche=8343\n",
      "Epsilon=0.682488 Action_times=3867211 Epoche=8344\n",
      "Epsilon=0.682458 Action_times=3867651 Epoche=8345\n",
      "Epsilon=0.682353 Action_times=3869211 Epoche=8346\n",
      "Epsilon=0.682226 Action_times=3871103 Epoche=8347\n",
      "Epsilon=0.682026 Action_times=3874072 Epoche=8348\n",
      "Epsilon=0.681997 Action_times=3874517 Epoche=8349\n",
      "Epsilon=0.681957 Action_times=3875104 Epoche=8350\n",
      "Epsilon=0.681875 Action_times=3876322 Epoche=8351\n",
      "Epsilon=0.681822 Action_times=3877113 Epoche=8352\n",
      "Epsilon=0.681803 Action_times=3877398 Epoche=8353\n",
      "Epsilon=0.681739 Action_times=3878355 Epoche=8354\n",
      "Epsilon=0.681639 Action_times=3879835 Epoche=8355\n",
      "Epsilon=0.681563 Action_times=3880967 Epoche=8356\n",
      "Epsilon=0.681436 Action_times=3882869 Epoche=8357\n",
      "Epsilon=0.681351 Action_times=3884123 Epoche=8358\n",
      "Epsilon=0.681285 Action_times=3885117 Epoche=8359\n",
      "Epsilon=0.681094 Action_times=3887960 Epoche=8360\n",
      "Epsilon=0.681005 Action_times=3889288 Epoche=8361\n",
      "Epsilon=0.680813 Action_times=3892141 Epoche=8362\n",
      "Epsilon=0.680662 Action_times=3894397 Epoche=8363\n",
      "Epsilon=0.680567 Action_times=3895820 Epoche=8364\n",
      "Epsilon=0.680532 Action_times=3896332 Epoche=8365\n",
      "Epsilon=0.680426 Action_times=3897922 Epoche=8366\n",
      "Epsilon=0.680381 Action_times=3898580 Epoche=8367\n",
      "Epsilon=0.680335 Action_times=3899267 Epoche=8368\n",
      "Epsilon=0.680320 Action_times=3899490 Epoche=8369\n",
      "Epsilon=0.680257 Action_times=3900431 Epoche=8370\n",
      "Epsilon=0.680202 Action_times=3901259 Epoche=8371\n",
      "Epsilon=0.680120 Action_times=3902483 Epoche=8372\n",
      "Epsilon=0.680086 Action_times=3902985 Epoche=8373\n",
      "Epsilon=0.680061 Action_times=3903359 Epoche=8374\n",
      "Epsilon=0.680046 Action_times=3903585 Epoche=8375\n",
      "Epsilon=0.679964 Action_times=3904811 Epoche=8376\n",
      "Epsilon=0.679933 Action_times=3905269 Epoche=8377\n",
      "Epsilon=0.679865 Action_times=3906289 Epoche=8378\n",
      "Epsilon=0.679845 Action_times=3906582 Epoche=8379\n",
      "Epsilon=0.679768 Action_times=3907738 Epoche=8380\n",
      "Epsilon=0.679703 Action_times=3908704 Epoche=8381\n",
      "Epsilon=0.679631 Action_times=3909788 Epoche=8382\n",
      "Epsilon=0.679582 Action_times=3910514 Epoche=8383\n",
      "Epsilon=0.679512 Action_times=3911560 Epoche=8384\n",
      "Epsilon=0.679462 Action_times=3912309 Epoche=8385\n",
      "Epsilon=0.679438 Action_times=3912664 Epoche=8386\n",
      "Epsilon=0.679366 Action_times=3913738 Epoche=8387\n",
      "Epsilon=0.679358 Action_times=3913861 Epoche=8388\n",
      "Epsilon=0.679293 Action_times=3914823 Epoche=8389\n",
      "Epsilon=0.679227 Action_times=3915814 Epoche=8390\n",
      "Epsilon=0.679128 Action_times=3917293 Epoche=8391\n",
      "Epsilon=0.679058 Action_times=3918342 Epoche=8392\n",
      "Epsilon=0.678985 Action_times=3919436 Epoche=8393\n",
      "Epsilon=0.678910 Action_times=3920553 Epoche=8394\n",
      "Epsilon=0.678843 Action_times=3921562 Epoche=8395\n",
      "Epsilon=0.678773 Action_times=3922608 Epoche=8396\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.678704 Action_times=3923636 Epoche=8397\n",
      "Epsilon=0.678629 Action_times=3924755 Epoche=8398\n",
      "Epsilon=0.678589 Action_times=3925351 Epoche=8399\n",
      "Epsilon=0.678477 Action_times=3927023 Epoche=8400\n",
      "Epsilon=0.678424 Action_times=3927824 Epoche=8401\n",
      "Epsilon=0.678407 Action_times=3928076 Epoche=8402\n",
      "Epsilon=0.678262 Action_times=3930240 Epoche=8403\n",
      "Epsilon=0.678211 Action_times=3931008 Epoche=8404\n",
      "Epsilon=0.678189 Action_times=3931345 Epoche=8405\n",
      "Epsilon=0.678140 Action_times=3932066 Epoche=8406\n",
      "Epsilon=0.678050 Action_times=3933422 Epoche=8407\n",
      "Epsilon=0.677975 Action_times=3934540 Epoche=8408\n",
      "Epsilon=0.677900 Action_times=3935659 Epoche=8409\n",
      "Epsilon=0.677821 Action_times=3936845 Epoche=8410\n",
      "Epsilon=0.677757 Action_times=3937807 Epoche=8411\n",
      "Epsilon=0.677665 Action_times=3939184 Epoche=8412\n",
      "Epsilon=0.677602 Action_times=3940128 Epoche=8413\n",
      "Epsilon=0.677538 Action_times=3941093 Epoche=8414\n",
      "Epsilon=0.677526 Action_times=3941273 Epoche=8415\n",
      "Epsilon=0.677450 Action_times=3942410 Epoche=8416\n",
      "Epsilon=0.677359 Action_times=3943761 Epoche=8417\n",
      "Epsilon=0.677258 Action_times=3945279 Epoche=8418\n",
      "Epsilon=0.677130 Action_times=3947206 Epoche=8419\n",
      "Epsilon=0.676967 Action_times=3949641 Epoche=8420\n",
      "Epsilon=0.676865 Action_times=3951175 Epoche=8421\n",
      "Epsilon=0.676810 Action_times=3952005 Epoche=8422\n",
      "Epsilon=0.676588 Action_times=3955335 Epoche=8423\n",
      "Epsilon=0.676521 Action_times=3956339 Epoche=8424\n",
      "Epsilon=0.676448 Action_times=3957421 Epoche=8425\n",
      "Epsilon=0.676390 Action_times=3958298 Epoche=8426\n",
      "Epsilon=0.676300 Action_times=3959655 Epoche=8427\n",
      "Epsilon=0.676281 Action_times=3959927 Epoche=8428\n",
      "Epsilon=0.676212 Action_times=3960967 Epoche=8429\n",
      "Epsilon=0.676133 Action_times=3962155 Epoche=8430\n",
      "Epsilon=0.676054 Action_times=3963346 Epoche=8431\n",
      "Epsilon=0.676011 Action_times=3963990 Epoche=8432\n",
      "Epsilon=0.675933 Action_times=3965164 Epoche=8433\n",
      "Epsilon=0.675912 Action_times=3965471 Epoche=8434\n",
      "Epsilon=0.675846 Action_times=3966470 Epoche=8435\n",
      "Epsilon=0.675816 Action_times=3966909 Epoche=8436\n",
      "Epsilon=0.675695 Action_times=3968736 Epoche=8437\n",
      "Epsilon=0.675678 Action_times=3968994 Epoche=8438\n",
      "Epsilon=0.675630 Action_times=3969717 Epoche=8439\n",
      "Epsilon=0.675615 Action_times=3969938 Epoche=8440\n",
      "Epsilon=0.675529 Action_times=3971221 Epoche=8441\n",
      "Epsilon=0.675509 Action_times=3971523 Epoche=8442\n",
      "Epsilon=0.675389 Action_times=3973329 Epoche=8443\n",
      "Epsilon=0.675227 Action_times=3975763 Epoche=8444\n",
      "Epsilon=0.674943 Action_times=3980033 Epoche=8445\n",
      "Epsilon=0.674817 Action_times=3981936 Epoche=8446\n",
      "Epsilon=0.674709 Action_times=3983550 Epoche=8447\n",
      "Epsilon=0.674570 Action_times=3985650 Epoche=8448\n",
      "Epsilon=0.674527 Action_times=3986292 Epoche=8449\n",
      "Epsilon=0.674504 Action_times=3986633 Epoche=8450\n",
      "Epsilon=0.674501 Action_times=3986685 Epoche=8451\n",
      "Epsilon=0.674419 Action_times=3987923 Epoche=8452\n",
      "Epsilon=0.674333 Action_times=3989218 Epoche=8453\n",
      "Epsilon=0.674314 Action_times=3989497 Epoche=8454\n",
      "Epsilon=0.674205 Action_times=3991138 Epoche=8455\n",
      "Epsilon=0.674194 Action_times=3991308 Epoche=8456\n",
      "Epsilon=0.674107 Action_times=3992620 Epoche=8457\n",
      "Epsilon=0.674106 Action_times=3992628 Epoche=8458\n",
      "Epsilon=0.674043 Action_times=3993580 Epoche=8459\n",
      "Epsilon=0.674023 Action_times=3993883 Epoche=8460\n",
      "Epsilon=0.674015 Action_times=3993999 Epoche=8461\n",
      "Epsilon=0.673956 Action_times=3994898 Epoche=8462\n",
      "Epsilon=0.673841 Action_times=3996620 Epoche=8463\n",
      "Epsilon=0.673579 Action_times=4000574 Epoche=8464\n",
      "Epsilon=0.673520 Action_times=4001452 Epoche=8465\n",
      "Epsilon=0.673467 Action_times=4002259 Epoche=8466\n",
      "Epsilon=0.673414 Action_times=4003054 Epoche=8467\n",
      "Epsilon=0.673327 Action_times=4004371 Epoche=8468\n",
      "Epsilon=0.673285 Action_times=4005001 Epoche=8469\n",
      "Epsilon=0.673153 Action_times=4006998 Epoche=8470\n",
      "Epsilon=0.673069 Action_times=4008255 Epoche=8471\n",
      "Epsilon=0.672980 Action_times=4009603 Epoche=8472\n",
      "Epsilon=0.672860 Action_times=4011415 Epoche=8473\n",
      "Epsilon=0.672805 Action_times=4012248 Epoche=8474\n",
      "Epsilon=0.672727 Action_times=4013411 Epoche=8475\n",
      "Epsilon=0.672671 Action_times=4014270 Epoche=8476\n",
      "Epsilon=0.672584 Action_times=4015576 Epoche=8477\n",
      "Epsilon=0.672514 Action_times=4016627 Epoche=8478\n",
      "Epsilon=0.672458 Action_times=4017482 Epoche=8479\n",
      "Epsilon=0.672404 Action_times=4018294 Epoche=8480\n",
      "Epsilon=0.672357 Action_times=4019003 Epoche=8481\n",
      "Epsilon=0.672298 Action_times=4019898 Epoche=8482\n",
      "Epsilon=0.672275 Action_times=4020242 Epoche=8483\n",
      "Epsilon=0.672245 Action_times=4020696 Epoche=8484\n",
      "Epsilon=0.672211 Action_times=4021206 Epoche=8485\n",
      "Epsilon=0.672141 Action_times=4022269 Epoche=8486\n",
      "Epsilon=0.672124 Action_times=4022527 Epoche=8487\n",
      "Epsilon=0.672043 Action_times=4023751 Epoche=8488\n",
      "Epsilon=0.671953 Action_times=4025110 Epoche=8489\n",
      "Epsilon=0.671919 Action_times=4025620 Epoche=8490\n",
      "Epsilon=0.671833 Action_times=4026915 Epoche=8491\n",
      "Epsilon=0.671736 Action_times=4028381 Epoche=8492\n",
      "Epsilon=0.671720 Action_times=4028624 Epoche=8493\n",
      "Epsilon=0.671599 Action_times=4030457 Epoche=8494\n",
      "Epsilon=0.671547 Action_times=4031242 Epoche=8495\n",
      "Epsilon=0.671511 Action_times=4031789 Epoche=8496\n",
      "Epsilon=0.671462 Action_times=4032530 Epoche=8497\n",
      "Epsilon=0.671427 Action_times=4033046 Epoche=8498\n",
      "Epsilon=0.671333 Action_times=4034472 Epoche=8499\n",
      "Epsilon=0.671303 Action_times=4034922 Epoche=8500\n",
      "Epsilon=0.671234 Action_times=4035970 Epoche=8501\n",
      "Epsilon=0.671169 Action_times=4036956 Epoche=8502\n",
      "Epsilon=0.671149 Action_times=4037260 Epoche=8503\n",
      "Epsilon=0.671078 Action_times=4038326 Epoche=8504\n",
      "Epsilon=0.670994 Action_times=4039596 Epoche=8505\n",
      "Epsilon=0.670893 Action_times=4041126 Epoche=8506\n",
      "Epsilon=0.670797 Action_times=4042587 Epoche=8507\n",
      "Epsilon=0.670718 Action_times=4043775 Epoche=8508\n",
      "Epsilon=0.670689 Action_times=4044213 Epoche=8509\n",
      "Epsilon=0.670591 Action_times=4045693 Epoche=8510\n",
      "Epsilon=0.670534 Action_times=4046564 Epoche=8511\n",
      "Epsilon=0.670453 Action_times=4047792 Epoche=8512\n",
      "Epsilon=0.670439 Action_times=4048001 Epoche=8513\n",
      "Epsilon=0.670396 Action_times=4048651 Epoche=8514\n",
      "Epsilon=0.670223 Action_times=4051277 Epoche=8515\n",
      "Epsilon=0.670119 Action_times=4052844 Epoche=8516\n",
      "Epsilon=0.670046 Action_times=4053947 Epoche=8517\n",
      "Epsilon=0.670013 Action_times=4054461 Epoche=8518\n",
      "Epsilon=0.669970 Action_times=4055107 Epoche=8519\n",
      "Epsilon=0.669937 Action_times=4055601 Epoche=8520\n",
      "Epsilon=0.669886 Action_times=4056379 Epoche=8521\n",
      "Epsilon=0.669798 Action_times=4057710 Epoche=8522\n",
      "Epsilon=0.669749 Action_times=4058461 Epoche=8523\n",
      "Epsilon=0.669720 Action_times=4058897 Epoche=8524\n",
      "Epsilon=0.669651 Action_times=4059937 Epoche=8525\n",
      "Epsilon=0.669586 Action_times=4060922 Epoche=8526\n",
      "Epsilon=0.669485 Action_times=4062464 Epoche=8527\n",
      "Epsilon=0.669441 Action_times=4063122 Epoche=8528\n",
      "Epsilon=0.669393 Action_times=4063850 Epoche=8529\n",
      "Epsilon=0.669286 Action_times=4065475 Epoche=8530\n",
      "Epsilon=0.669251 Action_times=4066011 Epoche=8531\n",
      "Epsilon=0.669173 Action_times=4067196 Epoche=8532\n",
      "Epsilon=0.669055 Action_times=4068978 Epoche=8533\n",
      "Epsilon=0.668995 Action_times=4069894 Epoche=8534\n",
      "Epsilon=0.668974 Action_times=4070211 Epoche=8535\n",
      "Epsilon=0.668949 Action_times=4070591 Epoche=8536\n",
      "Epsilon=0.668856 Action_times=4071992 Epoche=8537\n",
      "Epsilon=0.668791 Action_times=4072979 Epoche=8538\n",
      "Epsilon=0.668727 Action_times=4073960 Epoche=8539\n",
      "Epsilon=0.668649 Action_times=4075138 Epoche=8540\n",
      "Epsilon=0.668574 Action_times=4076283 Epoche=8541\n",
      "Epsilon=0.668499 Action_times=4077421 Epoche=8542\n",
      "Epsilon=0.668471 Action_times=4077849 Epoche=8543\n",
      "Epsilon=0.668371 Action_times=4079361 Epoche=8544\n",
      "Epsilon=0.668252 Action_times=4081174 Epoche=8545\n",
      "Epsilon=0.668212 Action_times=4081784 Epoche=8546\n",
      "Epsilon=0.668178 Action_times=4082292 Epoche=8547\n",
      "Epsilon=0.668008 Action_times=4084880 Epoche=8548\n",
      "Epsilon=0.667944 Action_times=4085846 Epoche=8549\n",
      "Epsilon=0.667871 Action_times=4086966 Epoche=8550\n",
      "Epsilon=0.667738 Action_times=4088977 Epoche=8551\n",
      "Epsilon=0.667663 Action_times=4090120 Epoche=8552\n",
      "Epsilon=0.667641 Action_times=4090455 Epoche=8553\n",
      "Epsilon=0.667590 Action_times=4091234 Epoche=8554\n",
      "Epsilon=0.667489 Action_times=4092770 Epoche=8555\n",
      "Epsilon=0.667412 Action_times=4093940 Epoche=8556\n",
      "Epsilon=0.667356 Action_times=4094799 Epoche=8557\n",
      "Epsilon=0.667325 Action_times=4095263 Epoche=8558\n",
      "Epsilon=0.667221 Action_times=4096840 Epoche=8559\n",
      "Epsilon=0.667190 Action_times=4097318 Epoche=8560\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.667153 Action_times=4097874 Epoche=8561\n",
      "Epsilon=0.667096 Action_times=4098746 Epoche=8562\n",
      "Epsilon=0.667034 Action_times=4099686 Epoche=8563\n",
      "Epsilon=0.666996 Action_times=4100271 Epoche=8564\n",
      "Epsilon=0.666938 Action_times=4101150 Epoche=8565\n",
      "Epsilon=0.666904 Action_times=4101665 Epoche=8566\n",
      "Epsilon=0.666901 Action_times=4101710 Epoche=8567\n",
      "Epsilon=0.666872 Action_times=4102160 Epoche=8568\n",
      "Epsilon=0.666838 Action_times=4102672 Epoche=8569\n",
      "Epsilon=0.666713 Action_times=4104583 Epoche=8570\n",
      "Epsilon=0.666665 Action_times=4105317 Epoche=8571\n",
      "Epsilon=0.666584 Action_times=4106546 Epoche=8572\n",
      "Epsilon=0.666502 Action_times=4107785 Epoche=8573\n",
      "Epsilon=0.666410 Action_times=4109191 Epoche=8574\n",
      "Epsilon=0.666342 Action_times=4110226 Epoche=8575\n",
      "Epsilon=0.666218 Action_times=4112118 Epoche=8576\n",
      "Epsilon=0.666212 Action_times=4112215 Epoche=8577\n",
      "Epsilon=0.666136 Action_times=4113375 Epoche=8578\n",
      "Epsilon=0.666082 Action_times=4114188 Epoche=8579\n",
      "Epsilon=0.666018 Action_times=4115161 Epoche=8580\n",
      "Epsilon=0.665854 Action_times=4117667 Epoche=8581\n",
      "Epsilon=0.665793 Action_times=4118602 Epoche=8582\n",
      "Epsilon=0.665758 Action_times=4119137 Epoche=8583\n",
      "Epsilon=0.665717 Action_times=4119754 Epoche=8584\n",
      "Epsilon=0.665687 Action_times=4120209 Epoche=8585\n",
      "Epsilon=0.665583 Action_times=4121799 Epoche=8586\n",
      "Epsilon=0.665466 Action_times=4123592 Epoche=8587\n",
      "Epsilon=0.665426 Action_times=4124188 Epoche=8588\n",
      "Epsilon=0.665284 Action_times=4126357 Epoche=8589\n",
      "Epsilon=0.665212 Action_times=4127466 Epoche=8590\n",
      "Epsilon=0.665123 Action_times=4128813 Epoche=8591\n",
      "Epsilon=0.665060 Action_times=4129774 Epoche=8592\n",
      "Epsilon=0.664979 Action_times=4131025 Epoche=8593\n",
      "Epsilon=0.664848 Action_times=4133020 Epoche=8594\n",
      "Epsilon=0.664803 Action_times=4133699 Epoche=8595\n",
      "Epsilon=0.664742 Action_times=4134634 Epoche=8596\n",
      "Epsilon=0.664706 Action_times=4135194 Epoche=8597\n",
      "Epsilon=0.664662 Action_times=4135865 Epoche=8598\n",
      "Epsilon=0.664612 Action_times=4136624 Epoche=8599\n",
      "Epsilon=0.664598 Action_times=4136843 Epoche=8600\n",
      "Epsilon=0.664506 Action_times=4138239 Epoche=8601\n",
      "Epsilon=0.664422 Action_times=4139530 Epoche=8602\n",
      "Epsilon=0.664386 Action_times=4140081 Epoche=8603\n",
      "Epsilon=0.664310 Action_times=4141233 Epoche=8604\n",
      "Epsilon=0.664280 Action_times=4141689 Epoche=8605\n",
      "Epsilon=0.664204 Action_times=4142864 Epoche=8606\n",
      "Epsilon=0.664130 Action_times=4143990 Epoche=8607\n",
      "Epsilon=0.664069 Action_times=4144917 Epoche=8608\n",
      "Epsilon=0.664025 Action_times=4145594 Epoche=8609\n",
      "Epsilon=0.663953 Action_times=4146688 Epoche=8610\n",
      "Epsilon=0.663869 Action_times=4147980 Epoche=8611\n",
      "Epsilon=0.663849 Action_times=4148290 Epoche=8612\n",
      "Epsilon=0.663789 Action_times=4149205 Epoche=8613\n",
      "Epsilon=0.663701 Action_times=4150553 Epoche=8614\n",
      "Epsilon=0.663681 Action_times=4150858 Epoche=8615\n",
      "Epsilon=0.663613 Action_times=4151893 Epoche=8616\n",
      "Epsilon=0.663553 Action_times=4152813 Epoche=8617\n",
      "Epsilon=0.663497 Action_times=4153664 Epoche=8618\n",
      "Epsilon=0.663432 Action_times=4154668 Epoche=8619\n",
      "Epsilon=0.663401 Action_times=4155139 Epoche=8620\n",
      "Epsilon=0.663387 Action_times=4155355 Epoche=8621\n",
      "Epsilon=0.663338 Action_times=4156111 Epoche=8622\n",
      "Epsilon=0.663289 Action_times=4156853 Epoche=8623\n",
      "Epsilon=0.663272 Action_times=4157110 Epoche=8624\n",
      "Epsilon=0.663194 Action_times=4158304 Epoche=8625\n",
      "Epsilon=0.663152 Action_times=4158944 Epoche=8626\n",
      "Epsilon=0.663147 Action_times=4159023 Epoche=8627\n",
      "Epsilon=0.663052 Action_times=4160481 Epoche=8628\n",
      "Epsilon=0.663010 Action_times=4161120 Epoche=8629\n",
      "Epsilon=0.662953 Action_times=4161992 Epoche=8630\n",
      "Epsilon=0.662866 Action_times=4163336 Epoche=8631\n",
      "Epsilon=0.662746 Action_times=4165163 Epoche=8632\n",
      "Epsilon=0.662604 Action_times=4167338 Epoche=8633\n",
      "Epsilon=0.662583 Action_times=4167673 Epoche=8634\n",
      "Epsilon=0.662529 Action_times=4168491 Epoche=8635\n",
      "Epsilon=0.662473 Action_times=4169351 Epoche=8636\n",
      "Epsilon=0.662395 Action_times=4170548 Epoche=8637\n",
      "Epsilon=0.662248 Action_times=4172797 Epoche=8638\n",
      "Epsilon=0.662205 Action_times=4173459 Epoche=8639\n",
      "Epsilon=0.662162 Action_times=4174118 Epoche=8640\n",
      "Epsilon=0.662125 Action_times=4174687 Epoche=8641\n",
      "Epsilon=0.662113 Action_times=4174876 Epoche=8642\n",
      "Epsilon=0.662005 Action_times=4176534 Epoche=8643\n",
      "Epsilon=0.661893 Action_times=4178238 Epoche=8644\n",
      "Epsilon=0.661841 Action_times=4179046 Epoche=8645\n",
      "Epsilon=0.661836 Action_times=4179113 Epoche=8646\n",
      "Epsilon=0.661775 Action_times=4180059 Epoche=8647\n",
      "Epsilon=0.661650 Action_times=4181972 Epoche=8648\n",
      "Epsilon=0.661522 Action_times=4183937 Epoche=8649\n",
      "Epsilon=0.661498 Action_times=4184306 Epoche=8650\n",
      "Epsilon=0.661472 Action_times=4184710 Epoche=8651\n",
      "Epsilon=0.661447 Action_times=4185086 Epoche=8652\n",
      "Epsilon=0.661412 Action_times=4185629 Epoche=8653\n",
      "Epsilon=0.661394 Action_times=4185908 Epoche=8654\n",
      "Epsilon=0.661346 Action_times=4186646 Epoche=8655\n",
      "Epsilon=0.661301 Action_times=4187326 Epoche=8656\n",
      "Epsilon=0.661245 Action_times=4188195 Epoche=8657\n",
      "Epsilon=0.661208 Action_times=4188751 Epoche=8658\n",
      "Epsilon=0.661179 Action_times=4189208 Epoche=8659\n",
      "Epsilon=0.661130 Action_times=4189953 Epoche=8660\n",
      "Epsilon=0.660998 Action_times=4191980 Epoche=8661\n",
      "Epsilon=0.660964 Action_times=4192508 Epoche=8662\n",
      "Epsilon=0.660874 Action_times=4193895 Epoche=8663\n",
      "Epsilon=0.660714 Action_times=4196354 Epoche=8664\n",
      "Epsilon=0.660632 Action_times=4197601 Epoche=8665\n",
      "Epsilon=0.660612 Action_times=4197912 Epoche=8666\n",
      "Epsilon=0.660591 Action_times=4198242 Epoche=8667\n",
      "Epsilon=0.660537 Action_times=4199064 Epoche=8668\n",
      "Epsilon=0.660484 Action_times=4199883 Epoche=8669\n",
      "Epsilon=0.660451 Action_times=4200397 Epoche=8670\n",
      "Epsilon=0.660437 Action_times=4200605 Epoche=8671\n",
      "Epsilon=0.660366 Action_times=4201702 Epoche=8672\n",
      "Epsilon=0.660227 Action_times=4203840 Epoche=8673\n",
      "Epsilon=0.660059 Action_times=4206414 Epoche=8674\n",
      "Epsilon=0.660017 Action_times=4207057 Epoche=8675\n",
      "Epsilon=0.659935 Action_times=4208325 Epoche=8676\n",
      "Epsilon=0.659911 Action_times=4208695 Epoche=8677\n",
      "Epsilon=0.659849 Action_times=4209655 Epoche=8678\n",
      "Epsilon=0.659820 Action_times=4210102 Epoche=8679\n",
      "Epsilon=0.659772 Action_times=4210841 Epoche=8680\n",
      "Epsilon=0.659714 Action_times=4211727 Epoche=8681\n",
      "Epsilon=0.659669 Action_times=4212417 Epoche=8682\n",
      "Epsilon=0.659605 Action_times=4213410 Epoche=8683\n",
      "Epsilon=0.659540 Action_times=4214401 Epoche=8684\n",
      "Epsilon=0.659460 Action_times=4215639 Epoche=8685\n",
      "Epsilon=0.659394 Action_times=4216654 Epoche=8686\n",
      "Epsilon=0.659359 Action_times=4217191 Epoche=8687\n",
      "Epsilon=0.659288 Action_times=4218289 Epoche=8688\n",
      "Epsilon=0.659277 Action_times=4218453 Epoche=8689\n",
      "Epsilon=0.659215 Action_times=4219414 Epoche=8690\n",
      "Epsilon=0.659121 Action_times=4220852 Epoche=8691\n",
      "Epsilon=0.659078 Action_times=4221522 Epoche=8692\n",
      "Epsilon=0.659024 Action_times=4222359 Epoche=8693\n",
      "Epsilon=0.658905 Action_times=4224188 Epoche=8694\n",
      "Epsilon=0.658866 Action_times=4224793 Epoche=8695\n",
      "Epsilon=0.658797 Action_times=4225854 Epoche=8696\n",
      "Epsilon=0.658702 Action_times=4227318 Epoche=8697\n",
      "Epsilon=0.658637 Action_times=4228313 Epoche=8698\n",
      "Epsilon=0.658563 Action_times=4229459 Epoche=8699\n",
      "Epsilon=0.658473 Action_times=4230847 Epoche=8700\n",
      "Epsilon=0.658466 Action_times=4230950 Epoche=8701\n",
      "Epsilon=0.658399 Action_times=4231984 Epoche=8702\n",
      "Epsilon=0.658374 Action_times=4232374 Epoche=8703\n",
      "Epsilon=0.658337 Action_times=4232938 Epoche=8704\n",
      "Epsilon=0.658298 Action_times=4233541 Epoche=8705\n",
      "Epsilon=0.658218 Action_times=4234778 Epoche=8706\n",
      "Epsilon=0.658163 Action_times=4235621 Epoche=8707\n",
      "Epsilon=0.658104 Action_times=4236537 Epoche=8708\n",
      "Epsilon=0.658092 Action_times=4236720 Epoche=8709\n",
      "Epsilon=0.658070 Action_times=4237055 Epoche=8710\n",
      "Epsilon=0.658039 Action_times=4237543 Epoche=8711\n",
      "Epsilon=0.657955 Action_times=4238833 Epoche=8712\n",
      "Epsilon=0.657938 Action_times=4239102 Epoche=8713\n",
      "Epsilon=0.657876 Action_times=4240051 Epoche=8714\n",
      "Epsilon=0.657845 Action_times=4240532 Epoche=8715\n",
      "Epsilon=0.657770 Action_times=4241686 Epoche=8716\n",
      "Epsilon=0.657707 Action_times=4242664 Epoche=8717\n",
      "Epsilon=0.657666 Action_times=4243295 Epoche=8718\n",
      "Epsilon=0.657580 Action_times=4244624 Epoche=8719\n",
      "Epsilon=0.657510 Action_times=4245700 Epoche=8720\n",
      "Epsilon=0.657508 Action_times=4245745 Epoche=8721\n",
      "Epsilon=0.657372 Action_times=4247831 Epoche=8722\n",
      "Epsilon=0.657352 Action_times=4248151 Epoche=8723\n",
      "Epsilon=0.657309 Action_times=4248813 Epoche=8724\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.657236 Action_times=4249934 Epoche=8725\n",
      "Epsilon=0.657222 Action_times=4250150 Epoche=8726\n",
      "Epsilon=0.657130 Action_times=4251581 Epoche=8727\n",
      "Epsilon=0.657060 Action_times=4252666 Epoche=8728\n",
      "Epsilon=0.656977 Action_times=4253940 Epoche=8729\n",
      "Epsilon=0.656968 Action_times=4254082 Epoche=8730\n",
      "Epsilon=0.656878 Action_times=4255478 Epoche=8731\n",
      "Epsilon=0.656842 Action_times=4256028 Epoche=8732\n",
      "Epsilon=0.656707 Action_times=4258118 Epoche=8733\n",
      "Epsilon=0.656623 Action_times=4259418 Epoche=8734\n",
      "Epsilon=0.656501 Action_times=4261296 Epoche=8735\n",
      "Epsilon=0.656468 Action_times=4261807 Epoche=8736\n",
      "Epsilon=0.656309 Action_times=4264279 Epoche=8737\n",
      "Epsilon=0.656178 Action_times=4266307 Epoche=8738\n",
      "Epsilon=0.656116 Action_times=4267255 Epoche=8739\n",
      "Epsilon=0.656079 Action_times=4267830 Epoche=8740\n",
      "Epsilon=0.655945 Action_times=4269909 Epoche=8741\n",
      "Epsilon=0.655859 Action_times=4271231 Epoche=8742\n",
      "Epsilon=0.655776 Action_times=4272521 Epoche=8743\n",
      "Epsilon=0.655689 Action_times=4273871 Epoche=8744\n",
      "Epsilon=0.655622 Action_times=4274906 Epoche=8745\n",
      "Epsilon=0.655505 Action_times=4276723 Epoche=8746\n",
      "Epsilon=0.655429 Action_times=4277899 Epoche=8747\n",
      "Epsilon=0.655386 Action_times=4278558 Epoche=8748\n",
      "Epsilon=0.655292 Action_times=4280021 Epoche=8749\n",
      "Epsilon=0.655275 Action_times=4280278 Epoche=8750\n",
      "Epsilon=0.655194 Action_times=4281538 Epoche=8751\n",
      "Epsilon=0.655156 Action_times=4282131 Epoche=8752\n",
      "Epsilon=0.655085 Action_times=4283224 Epoche=8753\n",
      "Epsilon=0.655084 Action_times=4283250 Epoche=8754\n",
      "Epsilon=0.654995 Action_times=4284617 Epoche=8755\n",
      "Epsilon=0.654876 Action_times=4286473 Epoche=8756\n",
      "Epsilon=0.654846 Action_times=4286939 Epoche=8757\n",
      "Epsilon=0.654752 Action_times=4288390 Epoche=8758\n",
      "Epsilon=0.654712 Action_times=4289008 Epoche=8759\n",
      "Epsilon=0.654698 Action_times=4289235 Epoche=8760\n",
      "Epsilon=0.654508 Action_times=4292177 Epoche=8761\n",
      "Epsilon=0.654465 Action_times=4292851 Epoche=8762\n",
      "Epsilon=0.654352 Action_times=4294594 Epoche=8763\n",
      "Epsilon=0.654223 Action_times=4296594 Epoche=8764\n",
      "Epsilon=0.654199 Action_times=4296966 Epoche=8765\n",
      "Epsilon=0.654178 Action_times=4297291 Epoche=8766\n",
      "Epsilon=0.654075 Action_times=4298895 Epoche=8767\n",
      "Epsilon=0.654028 Action_times=4299631 Epoche=8768\n",
      "Epsilon=0.653990 Action_times=4300213 Epoche=8769\n",
      "Epsilon=0.653960 Action_times=4300680 Epoche=8770\n",
      "Epsilon=0.653901 Action_times=4301594 Epoche=8771\n",
      "Epsilon=0.653797 Action_times=4303218 Epoche=8772\n",
      "Epsilon=0.653680 Action_times=4305036 Epoche=8773\n",
      "Epsilon=0.653604 Action_times=4306217 Epoche=8774\n",
      "Epsilon=0.653582 Action_times=4306553 Epoche=8775\n",
      "Epsilon=0.653561 Action_times=4306883 Epoche=8776\n",
      "Epsilon=0.653517 Action_times=4307561 Epoche=8777\n",
      "Epsilon=0.653483 Action_times=4308090 Epoche=8778\n",
      "Epsilon=0.653414 Action_times=4309159 Epoche=8779\n",
      "Epsilon=0.653328 Action_times=4310501 Epoche=8780\n",
      "Epsilon=0.653308 Action_times=4310814 Epoche=8781\n",
      "Epsilon=0.653209 Action_times=4312345 Epoche=8782\n",
      "Epsilon=0.653153 Action_times=4313228 Epoche=8783\n",
      "Epsilon=0.653142 Action_times=4313388 Epoche=8784\n",
      "Epsilon=0.653090 Action_times=4314209 Epoche=8785\n",
      "Epsilon=0.653001 Action_times=4315586 Epoche=8786\n",
      "Epsilon=0.652987 Action_times=4315803 Epoche=8787\n",
      "Epsilon=0.652932 Action_times=4316662 Epoche=8788\n",
      "Epsilon=0.652795 Action_times=4318790 Epoche=8789\n",
      "Epsilon=0.652720 Action_times=4319955 Epoche=8790\n",
      "Epsilon=0.652625 Action_times=4321433 Epoche=8791\n",
      "Epsilon=0.652541 Action_times=4322742 Epoche=8792\n",
      "Epsilon=0.652464 Action_times=4323944 Epoche=8793\n",
      "Epsilon=0.652437 Action_times=4324362 Epoche=8794\n",
      "Epsilon=0.652401 Action_times=4324922 Epoche=8795\n",
      "Epsilon=0.652356 Action_times=4325618 Epoche=8796\n",
      "Epsilon=0.652309 Action_times=4326352 Epoche=8797\n",
      "Epsilon=0.652290 Action_times=4326644 Epoche=8798\n",
      "Epsilon=0.652191 Action_times=4328189 Epoche=8799\n",
      "Epsilon=0.652118 Action_times=4329329 Epoche=8800\n",
      "Epsilon=0.651992 Action_times=4331295 Epoche=8801\n",
      "Epsilon=0.651922 Action_times=4332380 Epoche=8802\n",
      "Epsilon=0.651836 Action_times=4333719 Epoche=8803\n",
      "Epsilon=0.651787 Action_times=4334482 Epoche=8804\n",
      "Epsilon=0.651751 Action_times=4335039 Epoche=8805\n",
      "Epsilon=0.651685 Action_times=4336078 Epoche=8806\n",
      "Epsilon=0.651572 Action_times=4337832 Epoche=8807\n",
      "Epsilon=0.651520 Action_times=4338653 Epoche=8808\n",
      "Epsilon=0.651476 Action_times=4339335 Epoche=8809\n",
      "Epsilon=0.651428 Action_times=4340079 Epoche=8810\n",
      "Epsilon=0.651406 Action_times=4340426 Epoche=8811\n",
      "Epsilon=0.651351 Action_times=4341284 Epoche=8812\n",
      "Epsilon=0.651300 Action_times=4342077 Epoche=8813\n",
      "Epsilon=0.651255 Action_times=4342771 Epoche=8814\n",
      "Epsilon=0.651134 Action_times=4344657 Epoche=8815\n",
      "Epsilon=0.651110 Action_times=4345045 Epoche=8816\n",
      "Epsilon=0.650976 Action_times=4347122 Epoche=8817\n",
      "Epsilon=0.650919 Action_times=4348020 Epoche=8818\n",
      "Epsilon=0.650875 Action_times=4348701 Epoche=8819\n",
      "Epsilon=0.650839 Action_times=4349263 Epoche=8820\n",
      "Epsilon=0.650687 Action_times=4351639 Epoche=8821\n",
      "Epsilon=0.650576 Action_times=4353374 Epoche=8822\n",
      "Epsilon=0.650432 Action_times=4355626 Epoche=8823\n",
      "Epsilon=0.650364 Action_times=4356682 Epoche=8824\n",
      "Epsilon=0.650272 Action_times=4358125 Epoche=8825\n",
      "Epsilon=0.650226 Action_times=4358843 Epoche=8826\n",
      "Epsilon=0.650185 Action_times=4359471 Epoche=8827\n",
      "Epsilon=0.650148 Action_times=4360051 Epoche=8828\n",
      "Epsilon=0.650078 Action_times=4361154 Epoche=8829\n",
      "Epsilon=0.650019 Action_times=4362063 Epoche=8830\n",
      "Epsilon=0.649948 Action_times=4363188 Epoche=8831\n",
      "Epsilon=0.649890 Action_times=4364087 Epoche=8832\n",
      "Epsilon=0.649853 Action_times=4364659 Epoche=8833\n",
      "Epsilon=0.649810 Action_times=4365337 Epoche=8834\n",
      "Epsilon=0.649795 Action_times=4365564 Epoche=8835\n",
      "Epsilon=0.649728 Action_times=4366613 Epoche=8836\n",
      "Epsilon=0.649567 Action_times=4369132 Epoche=8837\n",
      "Epsilon=0.649513 Action_times=4369973 Epoche=8838\n",
      "Epsilon=0.649432 Action_times=4371250 Epoche=8839\n",
      "Epsilon=0.649306 Action_times=4373223 Epoche=8840\n",
      "Epsilon=0.649231 Action_times=4374395 Epoche=8841\n",
      "Epsilon=0.649193 Action_times=4374990 Epoche=8842\n",
      "Epsilon=0.649143 Action_times=4375773 Epoche=8843\n",
      "Epsilon=0.649073 Action_times=4376870 Epoche=8844\n",
      "Epsilon=0.648962 Action_times=4378607 Epoche=8845\n",
      "Epsilon=0.648870 Action_times=4380038 Epoche=8846\n",
      "Epsilon=0.648710 Action_times=4382550 Epoche=8847\n",
      "Epsilon=0.648647 Action_times=4383536 Epoche=8848\n",
      "Epsilon=0.648631 Action_times=4383780 Epoche=8849\n",
      "Epsilon=0.648597 Action_times=4384308 Epoche=8850\n",
      "Epsilon=0.648583 Action_times=4384533 Epoche=8851\n",
      "Epsilon=0.648504 Action_times=4385772 Epoche=8852\n",
      "Epsilon=0.648419 Action_times=4387097 Epoche=8853\n",
      "Epsilon=0.648346 Action_times=4388245 Epoche=8854\n",
      "Epsilon=0.648340 Action_times=4388338 Epoche=8855\n",
      "Epsilon=0.648282 Action_times=4389249 Epoche=8856\n",
      "Epsilon=0.648199 Action_times=4390545 Epoche=8857\n",
      "Epsilon=0.648120 Action_times=4391789 Epoche=8858\n",
      "Epsilon=0.648057 Action_times=4392772 Epoche=8859\n",
      "Epsilon=0.648035 Action_times=4393118 Epoche=8860\n",
      "Epsilon=0.647990 Action_times=4393828 Epoche=8861\n",
      "Epsilon=0.647866 Action_times=4395774 Epoche=8862\n",
      "Epsilon=0.647758 Action_times=4397468 Epoche=8863\n",
      "Epsilon=0.647736 Action_times=4397811 Epoche=8864\n",
      "Epsilon=0.647701 Action_times=4398351 Epoche=8865\n",
      "Epsilon=0.647643 Action_times=4399266 Epoche=8866\n",
      "Epsilon=0.647596 Action_times=4400008 Epoche=8867\n",
      "Epsilon=0.647506 Action_times=4401410 Epoche=8868\n",
      "Epsilon=0.647459 Action_times=4402142 Epoche=8869\n",
      "Epsilon=0.647411 Action_times=4402906 Epoche=8870\n",
      "Epsilon=0.647367 Action_times=4403590 Epoche=8871\n",
      "Epsilon=0.647318 Action_times=4404366 Epoche=8872\n",
      "Epsilon=0.647255 Action_times=4405343 Epoche=8873\n",
      "Epsilon=0.647193 Action_times=4406322 Epoche=8874\n",
      "Epsilon=0.647130 Action_times=4407307 Epoche=8875\n",
      "Epsilon=0.647088 Action_times=4407971 Epoche=8876\n",
      "Epsilon=0.647020 Action_times=4409035 Epoche=8877\n",
      "Epsilon=0.646976 Action_times=4409728 Epoche=8878\n",
      "Epsilon=0.646922 Action_times=4410575 Epoche=8879\n",
      "Epsilon=0.646912 Action_times=4410735 Epoche=8880\n",
      "Epsilon=0.646829 Action_times=4412039 Epoche=8881\n",
      "Epsilon=0.646737 Action_times=4413484 Epoche=8882\n",
      "Epsilon=0.646692 Action_times=4414197 Epoche=8883\n",
      "Epsilon=0.646663 Action_times=4414646 Epoche=8884\n",
      "Epsilon=0.646651 Action_times=4414826 Epoche=8885\n",
      "Epsilon=0.646641 Action_times=4414984 Epoche=8886\n",
      "Epsilon=0.646611 Action_times=4415461 Epoche=8887\n",
      "Epsilon=0.646598 Action_times=4415669 Epoche=8888\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epsilon=0.646545 Action_times=4416504 Epoche=8889\n",
      "Epsilon=0.646496 Action_times=4417269 Epoche=8890\n",
      "Epsilon=0.646472 Action_times=4417653 Epoche=8891\n",
      "Epsilon=0.646422 Action_times=4418429 Epoche=8892\n",
      "Epsilon=0.646284 Action_times=4420607 Epoche=8893\n",
      "Epsilon=0.646263 Action_times=4420929 Epoche=8894\n",
      "Epsilon=0.646237 Action_times=4421339 Epoche=8895\n",
      "Epsilon=0.646216 Action_times=4421665 Epoche=8896\n",
      "Epsilon=0.646154 Action_times=4422637 Epoche=8897\n",
      "Epsilon=0.646134 Action_times=4422960 Epoche=8898\n",
      "Epsilon=0.646040 Action_times=4424440 Epoche=8899\n",
      "Epsilon=0.645987 Action_times=4425261 Epoche=8900\n",
      "Epsilon=0.645953 Action_times=4425804 Epoche=8901\n",
      "Epsilon=0.645898 Action_times=4426660 Epoche=8902\n",
      "Epsilon=0.645842 Action_times=4427549 Epoche=8903\n",
      "Epsilon=0.645796 Action_times=4428271 Epoche=8904\n",
      "Epsilon=0.645700 Action_times=4429785 Epoche=8905\n",
      "Epsilon=0.645598 Action_times=4431387 Epoche=8906\n",
      "Epsilon=0.645583 Action_times=4431627 Epoche=8907\n",
      "Epsilon=0.645474 Action_times=4433334 Epoche=8908\n",
      "Epsilon=0.645393 Action_times=4434612 Epoche=8909\n",
      "Epsilon=0.645351 Action_times=4435275 Epoche=8910\n",
      "Epsilon=0.645331 Action_times=4435582 Epoche=8911\n",
      "Epsilon=0.645310 Action_times=4435914 Epoche=8912\n",
      "Epsilon=0.645282 Action_times=4436361 Epoche=8913\n",
      "Epsilon=0.645201 Action_times=4437633 Epoche=8914\n",
      "Epsilon=0.645094 Action_times=4439323 Epoche=8915\n",
      "Epsilon=0.645058 Action_times=4439881 Epoche=8916\n",
      "Epsilon=0.645018 Action_times=4440521 Epoche=8917\n",
      "Epsilon=0.644925 Action_times=4441985 Epoche=8918\n",
      "Epsilon=0.644898 Action_times=4442402 Epoche=8919\n",
      "Epsilon=0.644868 Action_times=4442879 Epoche=8920\n",
      "Epsilon=0.644742 Action_times=4444870 Epoche=8921\n",
      "Epsilon=0.644654 Action_times=4446256 Epoche=8922\n",
      "Epsilon=0.644611 Action_times=4446933 Epoche=8923\n",
      "Epsilon=0.644535 Action_times=4448123 Epoche=8924\n",
      "Epsilon=0.644464 Action_times=4449246 Epoche=8925\n",
      "Epsilon=0.644337 Action_times=4451238 Epoche=8926\n",
      "Epsilon=0.644250 Action_times=4452625 Epoche=8927\n",
      "Epsilon=0.644178 Action_times=4453745 Epoche=8928\n",
      "Epsilon=0.644130 Action_times=4454507 Epoche=8929\n",
      "Epsilon=0.644026 Action_times=4456148 Epoche=8930\n",
      "Epsilon=0.643952 Action_times=4457315 Epoche=8931\n",
      "Epsilon=0.643904 Action_times=4458082 Epoche=8932\n",
      "Epsilon=0.643877 Action_times=4458496 Epoche=8933\n",
      "Epsilon=0.643808 Action_times=4459584 Epoche=8934\n",
      "Epsilon=0.643778 Action_times=4460056 Epoche=8935\n",
      "Epsilon=0.643688 Action_times=4461483 Epoche=8936\n",
      "Epsilon=0.643572 Action_times=4463319 Epoche=8937\n",
      "Epsilon=0.643505 Action_times=4464363 Epoche=8938\n",
      "Epsilon=0.643475 Action_times=4464842 Epoche=8939\n",
      "Epsilon=0.643284 Action_times=4467861 Epoche=8940\n",
      "Epsilon=0.643227 Action_times=4468758 Epoche=8941\n",
      "Epsilon=0.643136 Action_times=4470202 Epoche=8942\n",
      "Epsilon=0.643046 Action_times=4471619 Epoche=8943\n",
      "Epsilon=0.642954 Action_times=4473068 Epoche=8944\n",
      "Epsilon=0.642903 Action_times=4473877 Epoche=8945\n",
      "Epsilon=0.642879 Action_times=4474259 Epoche=8946\n",
      "Epsilon=0.642746 Action_times=4476352 Epoche=8947\n",
      "Epsilon=0.642636 Action_times=4478099 Epoche=8948\n",
      "Epsilon=0.642559 Action_times=4479318 Epoche=8949\n",
      "Epsilon=0.642436 Action_times=4481265 Epoche=8950\n",
      "Epsilon=0.642387 Action_times=4482027 Epoche=8951\n",
      "Epsilon=0.642287 Action_times=4483611 Epoche=8952\n",
      "Epsilon=0.642254 Action_times=4484132 Epoche=8953\n",
      "Epsilon=0.642239 Action_times=4484376 Epoche=8954\n",
      "Epsilon=0.642154 Action_times=4485726 Epoche=8955\n",
      "Epsilon=0.642121 Action_times=4486246 Epoche=8956\n",
      "Epsilon=0.642057 Action_times=4487250 Epoche=8957\n",
      "Epsilon=0.641990 Action_times=4488313 Epoche=8958\n",
      "Epsilon=0.641914 Action_times=4489522 Epoche=8959\n",
      "Epsilon=0.641880 Action_times=4490054 Epoche=8960\n",
      "Epsilon=0.641866 Action_times=4490279 Epoche=8961\n",
      "Epsilon=0.641830 Action_times=4490841 Epoche=8962\n",
      "Epsilon=0.641778 Action_times=4491671 Epoche=8963\n",
      "Epsilon=0.641771 Action_times=4491774 Epoche=8964\n",
      "Epsilon=0.641729 Action_times=4492440 Epoche=8965\n",
      "Epsilon=0.641675 Action_times=4493306 Epoche=8966\n",
      "Epsilon=0.641622 Action_times=4494143 Epoche=8967\n",
      "Epsilon=0.641522 Action_times=4495718 Epoche=8968\n",
      "Epsilon=0.641448 Action_times=4496886 Epoche=8969\n",
      "Epsilon=0.641407 Action_times=4497535 Epoche=8970\n",
      "Epsilon=0.641319 Action_times=4498936 Epoche=8971\n",
      "Epsilon=0.641200 Action_times=4500825 Epoche=8972\n",
      "Epsilon=0.641169 Action_times=4501313 Epoche=8973\n",
      "Epsilon=0.641063 Action_times=4502990 Epoche=8974\n",
      "Epsilon=0.641057 Action_times=4503086 Epoche=8975\n",
      "Epsilon=0.640968 Action_times=4504498 Epoche=8976\n",
      "Epsilon=0.640857 Action_times=4506257 Epoche=8977\n",
      "Epsilon=0.640742 Action_times=4508086 Epoche=8978\n",
      "Epsilon=0.640718 Action_times=4508457 Epoche=8979\n",
      "Epsilon=0.640679 Action_times=4509073 Epoche=8980\n",
      "Epsilon=0.640593 Action_times=4510448 Epoche=8981\n",
      "Epsilon=0.640498 Action_times=4511945 Epoche=8982\n",
      "Epsilon=0.640460 Action_times=4512556 Epoche=8983\n",
      "Epsilon=0.640405 Action_times=4513422 Epoche=8984\n",
      "Epsilon=0.640355 Action_times=4514212 Epoche=8985\n",
      "Epsilon=0.640308 Action_times=4514956 Epoche=8986\n",
      "Epsilon=0.640275 Action_times=4515487 Epoche=8987\n",
      "Epsilon=0.640245 Action_times=4515963 Epoche=8988\n",
      "Epsilon=0.640239 Action_times=4516066 Epoche=8989\n",
      "Epsilon=0.640207 Action_times=4516567 Epoche=8990\n",
      "Epsilon=0.640189 Action_times=4516844 Epoche=8991\n",
      "Epsilon=0.640133 Action_times=4517744 Epoche=8992\n",
      "Epsilon=0.640119 Action_times=4517965 Epoche=8993\n",
      "Epsilon=0.640101 Action_times=4518247 Epoche=8994\n",
      "Epsilon=0.640011 Action_times=4519677 Epoche=8995\n",
      "Epsilon=0.639969 Action_times=4520345 Epoche=8996\n",
      "Epsilon=0.639940 Action_times=4520798 Epoche=8997\n",
      "Epsilon=0.639900 Action_times=4521438 Epoche=8998\n",
      "Epsilon=0.639776 Action_times=4523409 Epoche=8999\n"
     ]
    }
   ],
   "source": [
    "VoteInMajority=np.arange(3)\n",
    "for i in VoteInMajority:\n",
    "    print(i)\n",
    "    Table=Run_function()\n",
    "    Names_Table='Test4_Table'+str(i)+'.txt'\n",
    "    MaxQValueAction=np.argmax(Table,axis=1)\n",
    "    Names_MaxQValueAction='Test4_MaxQValueAction'+str(i)+'.txt'\n",
    "    np.savetxt(Names_MaxQValueAction,MaxQValueAction)\n",
    "    np.savetxt(Names_Table,Table)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 631,
   "metadata": {
    "scrolled": false
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style>\n",
       "    .dataframe thead tr:only-child th {\n",
       "        text-align: right;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: left;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Max0</th>\n",
       "      <th>Max1</th>\n",
       "      <th>Max2</th>\n",
       "      <th>Final_action</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>L60D0/30/H0</th>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L180D0/30/H0</th>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L250D0/30/H0</th>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L300D0/30/H0</th>\n",
       "      <td>0</td>\n",
       "      <td>4</td>\n",
       "      <td>3</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L60D30/60/H0</th>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L180D30/60/H0</th>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L250D30/60/H0</th>\n",
       "      <td>0</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L300D30/60/H0</th>\n",
       "      <td>0</td>\n",
       "      <td>3</td>\n",
       "      <td>4</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L60D60/90/H0</th>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L180D60/90/H0</th>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L250D60/90/H0</th>\n",
       "      <td>4</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L300D60/90/H0</th>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L60D90/120/H0</th>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L180D90/120/H0</th>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L250D90/120/H0</th>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L300D90/120/H0</th>\n",
       "      <td>3</td>\n",
       "      <td>0</td>\n",
       "      <td>4</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L60D120/150/H0</th>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L180D120/150/H0</th>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L250D120/150/H0</th>\n",
       "      <td>4</td>\n",
       "      <td>0</td>\n",
       "      <td>3</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L300D120/150/H0</th>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L60D150/180/H0</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>3</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L180D150/180/H0</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>3</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L250D150/180/H0</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>3</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L300D150/180/H0</th>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L60D180/210/H0</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L180D180/210/H0</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>3</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L250D180/210/H0</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L300D180/210/H0</th>\n",
       "      <td>4</td>\n",
       "      <td>3</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L60D210/240/H0</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L180D210/240/H0</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L250D210/240/H0</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L300D210/240/H0</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L60D240/270/H0</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L180D240/270/H0</th>\n",
       "      <td>0</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L250D240/270/H0</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L300D240/270/H0</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L60D270/300/H0</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L180D270/300/H0</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L250D270/300/H0</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L300D270/300/H0</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L60D300/330/H0</th>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L180D300/330/H0</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L250D300/330/H0</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L300D300/330/H0</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>0</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L60D330/360/H0</th>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L180D330/360/H0</th>\n",
       "      <td>4</td>\n",
       "      <td>0</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L250D330/360/H0</th>\n",
       "      <td>3</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L300D330/360/H0</th>\n",
       "      <td>4</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L60D0/30/H1</th>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>1</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L180D0/30/H1</th>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "      <td>3</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L250D0/30/H1</th>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L300D0/30/H1</th>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "      <td>3</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L60D30/60/H1</th>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L180D30/60/H1</th>\n",
       "      <td>3</td>\n",
       "      <td>1</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L250D30/60/H1</th>\n",
       "      <td>3</td>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L300D30/60/H1</th>\n",
       "      <td>3</td>\n",
       "      <td>1</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L60D60/90/H1</th>\n",
       "      <td>1</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L180D60/90/H1</th>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L250D60/90/H1</th>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L300D60/90/H1</th>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L60D90/120/H1</th>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L180D90/120/H1</th>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L250D90/120/H1</th>\n",
       "      <td>3</td>\n",
       "      <td>1</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L300D90/120/H1</th>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L60D120/150/H1</th>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L180D120/150/H1</th>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L250D120/150/H1</th>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L300D120/150/H1</th>\n",
       "      <td>3</td>\n",
       "      <td>1</td>\n",
       "      <td>4</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L60D150/180/H1</th>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>4</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L180D150/180/H1</th>\n",
       "      <td>3</td>\n",
       "      <td>4</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L250D150/180/H1</th>\n",
       "      <td>4</td>\n",
       "      <td>1</td>\n",
       "      <td>3</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L300D150/180/H1</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>3</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L60D180/210/H1</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L180D180/210/H1</th>\n",
       "      <td>3</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L250D180/210/H1</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L300D180/210/H1</th>\n",
       "      <td>4</td>\n",
       "      <td>3</td>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L60D210/240/H1</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L180D210/240/H1</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L250D210/240/H1</th>\n",
       "      <td>3</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L300D210/240/H1</th>\n",
       "      <td>1</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L60D240/270/H1</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L180D240/270/H1</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L250D240/270/H1</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L300D240/270/H1</th>\n",
       "      <td>3</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L60D270/300/H1</th>\n",
       "      <td>1</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L180D270/300/H1</th>\n",
       "      <td>4</td>\n",
       "      <td>3</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L250D270/300/H1</th>\n",
       "      <td>4</td>\n",
       "      <td>1</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L300D270/300/H1</th>\n",
       "      <td>1</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L60D300/330/H1</th>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L180D300/330/H1</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>1</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L250D300/330/H1</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L300D300/330/H1</th>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "      <td>3</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L60D330/360/H1</th>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L180D330/360/H1</th>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>1</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L250D330/360/H1</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L300D330/360/H1</th>\n",
       "      <td>1</td>\n",
       "      <td>4</td>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L60D0/30/H2</th>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L180D0/30/H2</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>3</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L250D0/30/H2</th>\n",
       "      <td>4</td>\n",
       "      <td>3</td>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L300D0/30/H2</th>\n",
       "      <td>4</td>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L60D30/60/H2</th>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L180D30/60/H2</th>\n",
       "      <td>4</td>\n",
       "      <td>3</td>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L250D30/60/H2</th>\n",
       "      <td>2</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L300D30/60/H2</th>\n",
       "      <td>2</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L60D60/90/H2</th>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L180D60/90/H2</th>\n",
       "      <td>2</td>\n",
       "      <td>4</td>\n",
       "      <td>3</td>\n",
       "      <td>2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L250D60/90/H2</th>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L300D60/90/H2</th>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L60D90/120/H2</th>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L180D90/120/H2</th>\n",
       "      <td>4</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L250D90/120/H2</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>3</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L300D90/120/H2</th>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>2</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L60D120/150/H2</th>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L180D120/150/H2</th>\n",
       "      <td>4</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L250D120/150/H2</th>\n",
       "      <td>2</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L300D120/150/H2</th>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L60D150/180/H2</th>\n",
       "      <td>3</td>\n",
       "      <td>4</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L180D150/180/H2</th>\n",
       "      <td>4</td>\n",
       "      <td>3</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L250D150/180/H2</th>\n",
       "      <td>2</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L300D150/180/H2</th>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L60D180/210/H2</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L180D180/210/H2</th>\n",
       "      <td>4</td>\n",
       "      <td>3</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L250D180/210/H2</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L300D180/210/H2</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L60D210/240/H2</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L180D210/240/H2</th>\n",
       "      <td>4</td>\n",
       "      <td>3</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L250D210/240/H2</th>\n",
       "      <td>3</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L300D210/240/H2</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L60D240/270/H2</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L180D240/270/H2</th>\n",
       "      <td>3</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L250D240/270/H2</th>\n",
       "      <td>2</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L300D240/270/H2</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L60D270/300/H2</th>\n",
       "      <td>2</td>\n",
       "      <td>4</td>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L180D270/300/H2</th>\n",
       "      <td>2</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L250D270/300/H2</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L300D270/300/H2</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>2</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L60D300/330/H2</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L180D300/330/H2</th>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>2</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L250D300/330/H2</th>\n",
       "      <td>2</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L300D300/330/H2</th>\n",
       "      <td>2</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L60D330/360/H2</th>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>2</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L180D330/360/H2</th>\n",
       "      <td>3</td>\n",
       "      <td>2</td>\n",
       "      <td>4</td>\n",
       "      <td>2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L250D330/360/H2</th>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "      <td>4</td>\n",
       "      <td>2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>L300D330/360/H2</th>\n",
       "      <td>4</td>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                 Max0  Max1  Max2  Final_action\n",
       "L60D0/30/H0         0     0     0             0\n",
       "L180D0/30/H0        0     0     0             0\n",
       "L250D0/30/H0        0     0     0             0\n",
       "L300D0/30/H0        0     4     3             0\n",
       "L60D30/60/H0        3     3     3             3\n",
       "L180D30/60/H0       0     0     0             0\n",
       "L250D30/60/H0       0     3     3             3\n",
       "L300D30/60/H0       0     3     4             0\n",
       "L60D60/90/H0        3     3     3             3\n",
       "L180D60/90/H0       3     3     3             3\n",
       "L250D60/90/H0       4     3     3             3\n",
       "L300D60/90/H0       3     3     3             3\n",
       "L60D90/120/H0       3     3     3             3\n",
       "L180D90/120/H0      3     3     3             3\n",
       "L250D90/120/H0      3     3     3             3\n",
       "L300D90/120/H0      3     0     4             0\n",
       "L60D120/150/H0      3     3     3             3\n",
       "L180D120/150/H0     3     3     3             3\n",
       "L250D120/150/H0     4     0     3             0\n",
       "L300D120/150/H0     3     3     3             3\n",
       "L60D150/180/H0      4     4     3             4\n",
       "L180D150/180/H0     4     4     3             4\n",
       "L250D150/180/H0     4     4     3             4\n",
       "L300D150/180/H0     3     3     3             3\n",
       "L60D180/210/H0      4     4     4             4\n",
       "L180D180/210/H0     4     4     3             4\n",
       "L250D180/210/H0     4     4     4             4\n",
       "L300D180/210/H0     4     3     4             4\n",
       "L60D210/240/H0      4     4     4             4\n",
       "L180D210/240/H0     4     4     4             4\n",
       "L250D210/240/H0     4     4     4             4\n",
       "L300D210/240/H0     4     4     4             4\n",
       "L60D240/270/H0      4     4     4             4\n",
       "L180D240/270/H0     0     4     4             4\n",
       "L250D240/270/H0     4     4     4             4\n",
       "L300D240/270/H0     4     4     4             4\n",
       "L60D270/300/H0      4     4     4             4\n",
       "L180D270/300/H0     4     4     4             4\n",
       "L250D270/300/H0     4     4     4             4\n",
       "L300D270/300/H0     4     4     4             4\n",
       "L60D300/330/H0      0     0     0             0\n",
       "L180D300/330/H0     4     4     4             4\n",
       "L250D300/330/H0     4     4     4             4\n",
       "L300D300/330/H0     4     4     0             4\n",
       "L60D330/360/H0      0     0     0             0\n",
       "L180D330/360/H0     4     0     4             4\n",
       "L250D330/360/H0     3     0     0             0\n",
       "L300D330/360/H0     4     0     0             0\n",
       "L60D0/30/H1         3     3     1             3\n",
       "L180D0/30/H1        1     1     3             1\n",
       "L250D0/30/H1        1     1     1             1\n",
       "L300D0/30/H1        1     1     3             1\n",
       "L60D30/60/H1        3     3     3             3\n",
       "L180D30/60/H1       3     1     3             3\n",
       "L250D30/60/H1       3     1     1             1\n",
       "L300D30/60/H1       3     1     3             3\n",
       "L60D60/90/H1        1     3     3             3\n",
       "L180D60/90/H1       3     3     3             3\n",
       "L250D60/90/H1       3     3     3             3\n",
       "L300D60/90/H1       1     1     1             1\n",
       "L60D90/120/H1       3     3     3             3\n",
       "L180D90/120/H1      3     3     3             3\n",
       "L250D90/120/H1      3     1     3             3\n",
       "L300D90/120/H1      3     3     3             3\n",
       "L60D120/150/H1      3     3     3             3\n",
       "L180D120/150/H1     3     3     3             3\n",
       "L250D120/150/H1     3     3     3             3\n",
       "L300D120/150/H1     3     1     4             1\n",
       "L60D150/180/H1      3     3     4             3\n",
       "L180D150/180/H1     3     4     3             3\n",
       "L250D150/180/H1     4     1     3             1\n",
       "L300D150/180/H1     4     4     3             4\n",
       "L60D180/210/H1      4     4     4             4\n",
       "L180D180/210/H1     3     4     4             4\n",
       "L250D180/210/H1     4     4     4             4\n",
       "L300D180/210/H1     4     3     1             1\n",
       "L60D210/240/H1      4     4     4             4\n",
       "L180D210/240/H1     4     4     4             4\n",
       "L250D210/240/H1     3     4     4             4\n",
       "L300D210/240/H1     1     4     4             4\n",
       "L60D240/270/H1      4     4     4             4\n",
       "L180D240/270/H1     4     4     4             4\n",
       "L250D240/270/H1     4     4     4             4\n",
       "L300D240/270/H1     3     4     4             4\n",
       "L60D270/300/H1      1     4     4             4\n",
       "L180D270/300/H1     4     3     4             4\n",
       "L250D270/300/H1     4     1     4             4\n",
       "L300D270/300/H1     1     4     4             4\n",
       "L60D300/330/H1      1     1     1             1\n",
       "L180D300/330/H1     4     4     1             4\n",
       "L250D300/330/H1     4     4     4             4\n",
       "L300D300/330/H1     1     1     3             1\n",
       "L60D330/360/H1      1     1     1             1\n",
       "L180D330/360/H1     3     3     1             3\n",
       "L250D330/360/H1     4     4     4             4\n",
       "L300D330/360/H1     1     4     1             1\n",
       "L60D0/30/H2         2     2     2             2\n",
       "L180D0/30/H2        4     4     3             4\n",
       "L250D0/30/H2        4     3     2             2\n",
       "L300D0/30/H2        4     2     2             2\n",
       "L60D30/60/H2        2     2     2             2\n",
       "L180D30/60/H2       4     3     2             2\n",
       "L250D30/60/H2       2     3     3             3\n",
       "L300D30/60/H2       2     3     3             3\n",
       "L60D60/90/H2        3     3     3             3\n",
       "L180D60/90/H2       2     4     3             2\n",
       "L250D60/90/H2       3     3     3             3\n",
       "L300D60/90/H2       3     3     3             3\n",
       "L60D90/120/H2       3     3     3             3\n",
       "L180D90/120/H2      4     3     3             3\n",
       "L250D90/120/H2      4     4     3             4\n",
       "L300D90/120/H2      3     3     2             3\n",
       "L60D120/150/H2      3     3     3             3\n",
       "L180D120/150/H2     4     3     3             3\n",
       "L250D120/150/H2     2     3     3             3\n",
       "L300D120/150/H2     3     3     3             3\n",
       "L60D150/180/H2      3     4     3             3\n",
       "L180D150/180/H2     4     3     4             4\n",
       "L250D150/180/H2     2     3     3             3\n",
       "L300D150/180/H2     3     3     3             3\n",
       "L60D180/210/H2      4     4     4             4\n",
       "L180D180/210/H2     4     3     4             4\n",
       "L250D180/210/H2     4     4     4             4\n",
       "L300D180/210/H2     4     4     4             4\n",
       "L60D210/240/H2      4     4     4             4\n",
       "L180D210/240/H2     4     3     4             4\n",
       "L250D210/240/H2     3     4     4             4\n",
       "L300D210/240/H2     4     4     4             4\n",
       "L60D240/270/H2      4     4     4             4\n",
       "L180D240/270/H2     3     4     4             4\n",
       "L250D240/270/H2     2     4     4             4\n",
       "L300D240/270/H2     4     4     4             4\n",
       "L60D270/300/H2      2     4     2             2\n",
       "L180D270/300/H2     2     4     4             4\n",
       "L250D270/300/H2     4     4     4             4\n",
       "L300D270/300/H2     4     4     2             4\n",
       "L60D300/330/H2      4     4     4             4\n",
       "L180D300/330/H2     3     3     2             3\n",
       "L250D300/330/H2     2     4     4             4\n",
       "L300D300/330/H2     2     4     4             4\n",
       "L60D330/360/H2      4     4     2             4\n",
       "L180D330/360/H2     3     2     4             2\n",
       "L250D330/360/H2     2     2     4             2\n",
       "L300D330/360/H2     4     2     2             2"
      ]
     },
     "execution_count": 631,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "def f(x):\n",
    "    \"\"\"Return the most frequent value in x (non-negative integers).\n",
    "\n",
    "    np.bincount counts each value and argmax returns the first maximum,\n",
    "    so when several values are equally frequent the smallest one wins.\n",
    "    \"\"\"\n",
    "    return np.bincount(x).argmax()\n",
    "\n",
    "# One array of action indices per result file\n",
    "# (NOTE(review): file names suggest one file per training run - confirm).\n",
    "Max0=np.loadtxt(\"Test4_MaxQValueAction0.txt\")\n",
    "Max1=np.loadtxt(\"Test4_MaxQValueAction1.txt\")\n",
    "Max2=np.loadtxt(\"Test4_MaxQValueAction2.txt\")\n",
    "\n",
    "# Put the three arrays side by side as int8 columns; rows are labelled\n",
    "# positionally with States, so each file must list states in that order.\n",
    "Max=pd.DataFrame(\n",
    "    np.column_stack((Max0,Max1,Max2)),\n",
    "    index=States,\n",
    "    columns=['Max0','Max1','Max2'],\n",
    "    dtype=np.int8,\n",
    ")\n",
    "\n",
    "# Row-wise vote over the three columns gives the action kept for each state.\n",
    "Max['Final_action']=Max.apply(f,axis=1)\n",
    "Max"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.6.2"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
